系统初始示例
#!/usr/bin/env python
# -*- encoding: utf-8 -*-
# Created on 2019-11-28 11:25:10
# Project: foodmate
from pyspider.libs.base_handler import *
class Handler(BaseHandler):
    """pyspider handler for the foodmate standards download listing.

    The crawl has three stages: ``on_start`` seeds the listing URL,
    ``index_page`` follows the links found on a fetched page, and
    ``detail_page`` extracts the result record for each followed page.
    """

    # Empty: no handler-wide crawl options are set here.
    crawl_config = {}

    @every(minutes=24 * 60)
    def on_start(self):
        """Seed the crawl with the standards listing page.

        Scheduled through ``@every`` with 24 * 60 minutes (one day). The
        fetched page is handed to ``index_page``.
        """
        self.crawl('http://down.foodmate.net/standard/sort/1/', callback=self.index_page)

    @config(age=10 * 24 * 60 * 60)
    def index_page(self, response):
        """Queue every link on the page whose ``href`` starts with ``http``.

        Each matching link is crawled with ``detail_page`` as its callback.
        NOTE(review): ``age`` is presumably in seconds (ten days) -- confirm
        against the pyspider documentation.

        Args:
            response: The fetched page; ``response.doc`` is queried with a
                CSS selector.
        """
        for each in response.doc('a[href^="http"]').items():
            self.crawl(each.attr.href, callback=self.detail_page)

    @config(priority=2)
    def detail_page(self, response):
        """Build the result record for one followed page.

        Args:
            response: The fetched page.

        Returns:
            dict: ``"url"`` holds ``response.url`` and ``"title"`` holds the
            text of the page's ``<title>`` element.
        """
        return {
            "url": response.url,
            "title": response.doc('title').text(),
        }
数据库设置