├── .idea ├── dianping_data.iml ├── misc.xml ├── modules.xml ├── vcs.xml └── workspace.xml ├── README.md ├── anjuke ├── README.md ├── anjuke │ ├── __init__.py │ ├── __init__.pyc │ ├── items.py │ ├── items.pyc │ ├── middlewares.py │ ├── middlewares.pyc │ ├── pipelines.py │ ├── settings.py │ ├── settings.pyc │ └── spiders │ │ ├── __init__.py │ │ ├── __init__.pyc │ │ ├── anjuke_spider.py │ │ └── anjuke_spider.pyc └── scrapy.cfg ├── book_rank ├── .idea │ ├── book_rank.iml │ ├── encodings.xml │ ├── misc.xml │ ├── modules.xml │ └── workspace.xml ├── book_rank │ ├── __init__.py │ ├── __init__.pyc │ ├── items.py │ ├── items.pyc │ ├── pipelines.py │ ├── run.py │ ├── settings.py │ ├── settings.pyc │ └── spiders │ │ ├── __init__.py │ │ ├── __init__.pyc │ │ ├── bookspider.py │ │ └── bookspider.pyc ├── issue.txt └── scrapy.cfg ├── img_recognize ├── captcha-1.jpg ├── captcha-2.jpg └── readme.txt └── love_food ├── .DS_Store ├── .idea ├── love_food.iml ├── misc.xml ├── modules.xml ├── vcs.xml └── workspace.xml ├── love_food ├── .DS_Store ├── __init__.py ├── __init__.pyc ├── items.py ├── items.pyc ├── middlewares.py ├── middlewares.pyc ├── pipelines.py ├── pipelines.pyc ├── settings.py ├── settings.pyc └── spiders │ ├── __init__.py │ ├── __init__.pyc │ ├── foodspider.py │ └── foodspider.pyc └── scrapy.cfg /.idea/dianping_data.iml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/.idea/dianping_data.iml -------------------------------------------------------------------------------- /.idea/misc.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/.idea/misc.xml -------------------------------------------------------------------------------- /.idea/modules.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/.idea/modules.xml -------------------------------------------------------------------------------- /.idea/vcs.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/.idea/vcs.xml -------------------------------------------------------------------------------- /.idea/workspace.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/.idea/workspace.xml -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/README.md -------------------------------------------------------------------------------- /anjuke/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/anjuke/README.md -------------------------------------------------------------------------------- /anjuke/anjuke/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /anjuke/anjuke/__init__.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/anjuke/anjuke/__init__.pyc -------------------------------------------------------------------------------- /anjuke/anjuke/items.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/anjuke/anjuke/items.py -------------------------------------------------------------------------------- /anjuke/anjuke/items.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/anjuke/anjuke/items.pyc -------------------------------------------------------------------------------- /anjuke/anjuke/middlewares.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/anjuke/anjuke/middlewares.py -------------------------------------------------------------------------------- /anjuke/anjuke/middlewares.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/anjuke/anjuke/middlewares.pyc -------------------------------------------------------------------------------- /anjuke/anjuke/pipelines.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/anjuke/anjuke/pipelines.py -------------------------------------------------------------------------------- /anjuke/anjuke/settings.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/anjuke/anjuke/settings.py -------------------------------------------------------------------------------- /anjuke/anjuke/settings.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/anjuke/anjuke/settings.pyc -------------------------------------------------------------------------------- /anjuke/anjuke/spiders/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/anjuke/anjuke/spiders/__init__.py -------------------------------------------------------------------------------- /anjuke/anjuke/spiders/__init__.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/anjuke/anjuke/spiders/__init__.pyc -------------------------------------------------------------------------------- /anjuke/anjuke/spiders/anjuke_spider.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/anjuke/anjuke/spiders/anjuke_spider.py -------------------------------------------------------------------------------- /anjuke/anjuke/spiders/anjuke_spider.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/anjuke/anjuke/spiders/anjuke_spider.pyc -------------------------------------------------------------------------------- /anjuke/scrapy.cfg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/anjuke/scrapy.cfg -------------------------------------------------------------------------------- /book_rank/.idea/book_rank.iml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/book_rank/.idea/book_rank.iml -------------------------------------------------------------------------------- /book_rank/.idea/encodings.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/book_rank/.idea/encodings.xml -------------------------------------------------------------------------------- /book_rank/.idea/misc.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/book_rank/.idea/misc.xml -------------------------------------------------------------------------------- /book_rank/.idea/modules.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/book_rank/.idea/modules.xml -------------------------------------------------------------------------------- /book_rank/.idea/workspace.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/book_rank/.idea/workspace.xml -------------------------------------------------------------------------------- /book_rank/book_rank/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /book_rank/book_rank/__init__.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/book_rank/book_rank/__init__.pyc -------------------------------------------------------------------------------- /book_rank/book_rank/items.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/book_rank/book_rank/items.py -------------------------------------------------------------------------------- /book_rank/book_rank/items.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/book_rank/book_rank/items.pyc -------------------------------------------------------------------------------- /book_rank/book_rank/pipelines.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/book_rank/book_rank/pipelines.py -------------------------------------------------------------------------------- /book_rank/book_rank/run.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/book_rank/book_rank/run.py -------------------------------------------------------------------------------- /book_rank/book_rank/settings.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/book_rank/book_rank/settings.py -------------------------------------------------------------------------------- /book_rank/book_rank/settings.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/book_rank/book_rank/settings.pyc -------------------------------------------------------------------------------- /book_rank/book_rank/spiders/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/book_rank/book_rank/spiders/__init__.py -------------------------------------------------------------------------------- /book_rank/book_rank/spiders/__init__.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/book_rank/book_rank/spiders/__init__.pyc -------------------------------------------------------------------------------- /book_rank/book_rank/spiders/bookspider.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/book_rank/book_rank/spiders/bookspider.py -------------------------------------------------------------------------------- /book_rank/book_rank/spiders/bookspider.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/book_rank/book_rank/spiders/bookspider.pyc -------------------------------------------------------------------------------- /book_rank/issue.txt: -------------------------------------------------------------------------------- 1 | 忽略tbody,否则xpath正确,依然没数据 -------------------------------------------------------------------------------- /book_rank/scrapy.cfg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/book_rank/scrapy.cfg -------------------------------------------------------------------------------- /img_recognize/captcha-1.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/img_recognize/captcha-1.jpg -------------------------------------------------------------------------------- /img_recognize/captcha-2.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/img_recognize/captcha-2.jpg -------------------------------------------------------------------------------- /img_recognize/readme.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/img_recognize/readme.txt -------------------------------------------------------------------------------- /love_food/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/love_food/.DS_Store -------------------------------------------------------------------------------- /love_food/.idea/love_food.iml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/love_food/.idea/love_food.iml -------------------------------------------------------------------------------- /love_food/.idea/misc.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/love_food/.idea/misc.xml -------------------------------------------------------------------------------- /love_food/.idea/modules.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/love_food/.idea/modules.xml -------------------------------------------------------------------------------- /love_food/.idea/vcs.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/love_food/.idea/vcs.xml -------------------------------------------------------------------------------- /love_food/.idea/workspace.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/love_food/.idea/workspace.xml -------------------------------------------------------------------------------- /love_food/love_food/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/love_food/love_food/.DS_Store -------------------------------------------------------------------------------- /love_food/love_food/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /love_food/love_food/__init__.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/love_food/love_food/__init__.pyc -------------------------------------------------------------------------------- /love_food/love_food/items.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/love_food/love_food/items.py -------------------------------------------------------------------------------- /love_food/love_food/items.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/love_food/love_food/items.pyc -------------------------------------------------------------------------------- /love_food/love_food/middlewares.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/love_food/love_food/middlewares.py -------------------------------------------------------------------------------- /love_food/love_food/middlewares.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/love_food/love_food/middlewares.pyc -------------------------------------------------------------------------------- /love_food/love_food/pipelines.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/love_food/love_food/pipelines.py -------------------------------------------------------------------------------- /love_food/love_food/pipelines.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/love_food/love_food/pipelines.pyc -------------------------------------------------------------------------------- /love_food/love_food/settings.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/love_food/love_food/settings.py -------------------------------------------------------------------------------- /love_food/love_food/settings.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/love_food/love_food/settings.pyc -------------------------------------------------------------------------------- /love_food/love_food/spiders/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/love_food/love_food/spiders/__init__.py -------------------------------------------------------------------------------- /love_food/love_food/spiders/__init__.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/love_food/love_food/spiders/__init__.pyc -------------------------------------------------------------------------------- /love_food/love_food/spiders/foodspider.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/love_food/love_food/spiders/foodspider.py -------------------------------------------------------------------------------- /love_food/love_food/spiders/foodspider.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/love_food/love_food/spiders/foodspider.pyc -------------------------------------------------------------------------------- /love_food/scrapy.cfg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PyCN/dianping_data/HEAD/love_food/scrapy.cfg --------------------------------------------------------------------------------