├── .gitignore ├── README.md ├── pyloom ├── __init__.py ├── __main__.py ├── buckets.py ├── drivers.py ├── entry.py ├── errors.py ├── lua │ ├── bloom_cas.lua │ ├── bloom_check.lua │ ├── url_add.lua │ └── url_pop.lua ├── proxy.py ├── scheduler.py ├── tasks.py ├── user-agent.json ├── utils.py └── worker.py ├── setup.py └── spiders ├── DouBan250 ├── README.md ├── __init__.py └── configs.py ├── DouBanBooks ├── README.md ├── __init__.py ├── configs.py └── tasks.py ├── LaGou ├── README.md ├── __init__.py ├── configs.py └── tasks.py ├── PinDuoDuo ├── README.md ├── __init__.py ├── configs.py └── tasks.py ├── PinDuoDuoWEB ├── README.md ├── __init__.py ├── configs.py ├── get_anticontent.js └── tasks.py ├── WeiBo ├── README.md ├── __init__.py ├── configs.py └── tasks.py └── Ziroom ├── README.md ├── __init__.py ├── configs.py └── tasks.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/.gitignore -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/README.md -------------------------------------------------------------------------------- /pyloom/__init__.py: -------------------------------------------------------------------------------- 1 | from .tasks import Task 2 | -------------------------------------------------------------------------------- /pyloom/__main__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/pyloom/__main__.py -------------------------------------------------------------------------------- /pyloom/buckets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/pyloom/buckets.py -------------------------------------------------------------------------------- /pyloom/drivers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/pyloom/drivers.py -------------------------------------------------------------------------------- /pyloom/entry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/pyloom/entry.py -------------------------------------------------------------------------------- /pyloom/errors.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/pyloom/errors.py -------------------------------------------------------------------------------- /pyloom/lua/bloom_cas.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/pyloom/lua/bloom_cas.lua -------------------------------------------------------------------------------- /pyloom/lua/bloom_check.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/pyloom/lua/bloom_check.lua -------------------------------------------------------------------------------- /pyloom/lua/url_add.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/pyloom/lua/url_add.lua -------------------------------------------------------------------------------- /pyloom/lua/url_pop.lua: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/pyloom/lua/url_pop.lua -------------------------------------------------------------------------------- /pyloom/proxy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/pyloom/proxy.py -------------------------------------------------------------------------------- /pyloom/scheduler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/pyloom/scheduler.py -------------------------------------------------------------------------------- /pyloom/tasks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/pyloom/tasks.py -------------------------------------------------------------------------------- /pyloom/user-agent.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/pyloom/user-agent.json -------------------------------------------------------------------------------- /pyloom/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/pyloom/utils.py -------------------------------------------------------------------------------- /pyloom/worker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/pyloom/worker.py -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/setup.py -------------------------------------------------------------------------------- /spiders/DouBan250/README.md: -------------------------------------------------------------------------------- 1 | ## 豆瓣TOP250电影爬虫 2 | 3 | 用于演示编写最基本的爬虫、测试新功能。 -------------------------------------------------------------------------------- /spiders/DouBan250/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/spiders/DouBan250/__init__.py -------------------------------------------------------------------------------- /spiders/DouBan250/configs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/spiders/DouBan250/configs.py -------------------------------------------------------------------------------- /spiders/DouBanBooks/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/spiders/DouBanBooks/README.md -------------------------------------------------------------------------------- /spiders/DouBanBooks/__init__.py: -------------------------------------------------------------------------------- 1 | from .tasks import * 2 | -------------------------------------------------------------------------------- /spiders/DouBanBooks/configs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/spiders/DouBanBooks/configs.py -------------------------------------------------------------------------------- /spiders/DouBanBooks/tasks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/spiders/DouBanBooks/tasks.py -------------------------------------------------------------------------------- /spiders/LaGou/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/spiders/LaGou/README.md -------------------------------------------------------------------------------- /spiders/LaGou/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/spiders/LaGou/__init__.py -------------------------------------------------------------------------------- /spiders/LaGou/configs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/spiders/LaGou/configs.py -------------------------------------------------------------------------------- /spiders/LaGou/tasks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/spiders/LaGou/tasks.py -------------------------------------------------------------------------------- /spiders/PinDuoDuo/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/spiders/PinDuoDuo/README.md -------------------------------------------------------------------------------- /spiders/PinDuoDuo/__init__.py: -------------------------------------------------------------------------------- 1 | from .tasks import * 2 | -------------------------------------------------------------------------------- /spiders/PinDuoDuo/configs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/spiders/PinDuoDuo/configs.py -------------------------------------------------------------------------------- /spiders/PinDuoDuo/tasks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/spiders/PinDuoDuo/tasks.py -------------------------------------------------------------------------------- /spiders/PinDuoDuoWEB/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/spiders/PinDuoDuoWEB/README.md -------------------------------------------------------------------------------- /spiders/PinDuoDuoWEB/__init__.py: -------------------------------------------------------------------------------- 1 | from .tasks import * -------------------------------------------------------------------------------- /spiders/PinDuoDuoWEB/configs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/spiders/PinDuoDuoWEB/configs.py -------------------------------------------------------------------------------- /spiders/PinDuoDuoWEB/get_anticontent.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/spiders/PinDuoDuoWEB/get_anticontent.js -------------------------------------------------------------------------------- /spiders/PinDuoDuoWEB/tasks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/spiders/PinDuoDuoWEB/tasks.py -------------------------------------------------------------------------------- /spiders/WeiBo/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/spiders/WeiBo/README.md -------------------------------------------------------------------------------- /spiders/WeiBo/__init__.py: -------------------------------------------------------------------------------- 1 | from .tasks import * 2 | -------------------------------------------------------------------------------- /spiders/WeiBo/configs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/spiders/WeiBo/configs.py -------------------------------------------------------------------------------- /spiders/WeiBo/tasks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/spiders/WeiBo/tasks.py -------------------------------------------------------------------------------- /spiders/Ziroom/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/spiders/Ziroom/README.md -------------------------------------------------------------------------------- /spiders/Ziroom/__init__.py: -------------------------------------------------------------------------------- 1 | from .tasks import * 2 | -------------------------------------------------------------------------------- /spiders/Ziroom/configs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/spiders/Ziroom/configs.py -------------------------------------------------------------------------------- /spiders/Ziroom/tasks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/speng4096/PyLoom/HEAD/spiders/Ziroom/tasks.py --------------------------------------------------------------------------------