├── .gitignore ├── ChangeLog.md ├── LICENSE ├── README.md ├── docs ├── English.md ├── Franch.md ├── German.md ├── Italian.md ├── Japanese.md ├── Korean.md ├── Russian.md └── Spanish.md ├── pom.xml ├── seimicrawler ├── pom.xml └── src │ ├── main │ ├── java │ │ └── cn │ │ │ └── wanghaomiao │ │ │ └── seimi │ │ │ ├── Constants.java │ │ │ ├── annotation │ │ │ ├── Crawler.java │ │ │ ├── EnableSeimiCrawler.java │ │ │ ├── Interceptor.java │ │ │ ├── Queue.java │ │ │ ├── Xpath.java │ │ │ └── validate │ │ │ │ └── NotNull.java │ │ │ ├── boot │ │ │ └── Run.java │ │ │ ├── config │ │ │ └── SeimiConfig.java │ │ │ ├── core │ │ │ ├── CastToNumber.java │ │ │ ├── Seimi.java │ │ │ ├── SeimiContext.java │ │ │ ├── SeimiCrawler.java │ │ │ ├── SeimiDefScanConfig.java │ │ │ ├── SeimiDownloader.java │ │ │ ├── SeimiInterceptor.java │ │ │ ├── SeimiProcessor.java │ │ │ └── SeimiQueue.java │ │ │ ├── def │ │ │ ├── BaseSeimiCrawler.java │ │ │ ├── DefaultLocalQueue.java │ │ │ └── DefaultRedisQueue.java │ │ │ ├── exception │ │ │ ├── SeimiBeanResolveException.java │ │ │ ├── SeimiInitExcepiton.java │ │ │ └── SeimiProcessExcepiton.java │ │ │ ├── http │ │ │ ├── HttpMethod.java │ │ │ ├── SeimiAgentContentType.java │ │ │ ├── SeimiCookie.java │ │ │ ├── SeimiHttpType.java │ │ │ ├── hc │ │ │ │ ├── HcDownloader.java │ │ │ │ ├── HcRequestGenerator.java │ │ │ │ ├── HttpClientCMPBox.java │ │ │ │ ├── HttpClientConnectionManagerProvider.java │ │ │ │ ├── HttpClientFactory.java │ │ │ │ └── SeimiRedirectStrategy.java │ │ │ └── okhttp │ │ │ │ ├── CookiesManager.java │ │ │ │ ├── OkHttpClientBuilderBox.java │ │ │ │ ├── OkHttpClientBuilderProvider.java │ │ │ │ ├── OkHttpDownloader.java │ │ │ │ └── OkHttpRequestGenerator.java │ │ │ ├── httpd │ │ │ ├── CrawlerStatusHttpProcessor.java │ │ │ ├── HttpRequestProcessor.java │ │ │ ├── PushRequestHttpProcessor.java │ │ │ └── SeimiHttpHandler.java │ │ │ ├── spring │ │ │ ├── boot │ │ │ │ ├── CrawlerProperties.java │ │ │ │ ├── SeimiCrawlerAutoConfiguration.java │ │ │ │ └── SeimiCrawlerBeanRegistar.java │ │ │ └── common │ │ │ │ ├── CrawlerCache.java │ │ │ │ ├── SeimiCrawlerBaseConfig.java │ │ │ │ ├── SeimiCrawlerBeanPostProcessor.java │ │ │ │ ├── SeimiCrawlerBootstrapListener.java │ │ │ │ └── StandaloneCondition.java │ │ │ ├── struct │ │ │ ├── BodyType.java │ │ │ ├── CommonObject.java │ │ │ ├── CrawlerModel.java │ │ │ ├── Request.java │ │ │ └── Response.java │ │ │ └── utils │ │ │ ├── ClazzUtils.java │ │ │ ├── GenericUtils.java │ │ │ ├── StrFormatUtil.java │ │ │ ├── StructValidator.java │ │ │ └── SysEnvUtil.java │ └── resources │ │ └── META-INF │ │ └── spring.factories │ └── test │ └── java │ └── cn │ └── wanghaomiao │ └── seimi │ └── utils │ └── StrFormatUtilTest.java ├── spring-boot-example ├── pom.xml └── src │ └── main │ ├── java │ └── cn │ │ └── wanghaomiao │ │ └── seimi │ │ ├── SeimiCrawlerApplication.java │ │ ├── controller │ │ └── IndexController.java │ │ └── crawlers │ │ ├── Basic.java │ │ └── DefaultRedisQueueEG.java │ └── resources │ ├── application.properties │ └── seimi-app.xml └── standalone-example ├── pom.xml └── src ├── main ├── java │ └── cn │ │ └── wanghaomiao │ │ ├── annotations │ │ └── DoLog.java │ │ ├── crawlers │ │ ├── Basic.java │ │ ├── BasicWithScheduler.java │ │ ├── DatabaseMybatisDemo.java │ │ ├── DefaultRedisQueueEG.java │ │ ├── DynamicUserAgent.java │ │ ├── IntercepterDemo.java │ │ ├── JDWalker.java │ │ ├── MutiPageNewsCrawler.java │ │ ├── SeimiAgentDemo.java │ │ ├── StoreInFile.java │ │ ├── UseBeanResolver.java │ │ ├── UseCookie.java │ │ ├── UseDelay.java │ │ ├── UseDynamicProxy.java │ │ └── UseProxy.java │ │ ├── dao │ │ └── mybatis │ │ │ └── MybatisStoreDAO.java │ │ ├── interceptors │ │ └── DemoInterceptor.java │ │ ├── main │ │ ├── Boot.java │ │ └── StartWorkers.java │ │ └── model │ │ └── BlogContent.java └── resources │ ├── config │ ├── db_demo.sql │ └── seimi.properties │ ├── logback.xml │ ├── mybatis-config.xml │ ├── seimi-mybatis.xml │ └── seimi.xml └── test └── java └── cn └── wanghaomiao └── main └── RunTest.java /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/.gitignore -------------------------------------------------------------------------------- /ChangeLog.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/ChangeLog.md -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/README.md -------------------------------------------------------------------------------- /docs/English.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/docs/English.md -------------------------------------------------------------------------------- /docs/Franch.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/docs/Franch.md -------------------------------------------------------------------------------- /docs/German.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/docs/German.md -------------------------------------------------------------------------------- /docs/Italian.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/docs/Italian.md -------------------------------------------------------------------------------- /docs/Japanese.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/docs/Japanese.md -------------------------------------------------------------------------------- /docs/Korean.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/docs/Korean.md -------------------------------------------------------------------------------- /docs/Russian.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/docs/Russian.md -------------------------------------------------------------------------------- /docs/Spanish.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/docs/Spanish.md -------------------------------------------------------------------------------- /pom.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/pom.xml -------------------------------------------------------------------------------- /seimicrawler/pom.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/pom.xml -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/Constants.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/Constants.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/annotation/Crawler.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/annotation/Crawler.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/annotation/EnableSeimiCrawler.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/annotation/EnableSeimiCrawler.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/annotation/Interceptor.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/annotation/Interceptor.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/annotation/Queue.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/annotation/Queue.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/annotation/Xpath.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/annotation/Xpath.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/annotation/validate/NotNull.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/annotation/validate/NotNull.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/boot/Run.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/boot/Run.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/config/SeimiConfig.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/config/SeimiConfig.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/core/CastToNumber.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/core/CastToNumber.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/core/Seimi.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/core/Seimi.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/core/SeimiContext.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/core/SeimiContext.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/core/SeimiCrawler.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/core/SeimiCrawler.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/core/SeimiDefScanConfig.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/core/SeimiDefScanConfig.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/core/SeimiDownloader.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/core/SeimiDownloader.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/core/SeimiInterceptor.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/core/SeimiInterceptor.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/core/SeimiProcessor.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/core/SeimiProcessor.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/core/SeimiQueue.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/core/SeimiQueue.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/def/BaseSeimiCrawler.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/def/BaseSeimiCrawler.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/def/DefaultLocalQueue.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/def/DefaultLocalQueue.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/def/DefaultRedisQueue.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/def/DefaultRedisQueue.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/exception/SeimiBeanResolveException.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/exception/SeimiBeanResolveException.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/exception/SeimiInitExcepiton.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/exception/SeimiInitExcepiton.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/exception/SeimiProcessExcepiton.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/exception/SeimiProcessExcepiton.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/http/HttpMethod.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/http/HttpMethod.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/http/SeimiAgentContentType.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/http/SeimiAgentContentType.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/http/SeimiCookie.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/http/SeimiCookie.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/http/SeimiHttpType.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/http/SeimiHttpType.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/http/hc/HcDownloader.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/http/hc/HcDownloader.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/http/hc/HcRequestGenerator.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/http/hc/HcRequestGenerator.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/http/hc/HttpClientCMPBox.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/http/hc/HttpClientCMPBox.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/http/hc/HttpClientConnectionManagerProvider.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/http/hc/HttpClientConnectionManagerProvider.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/http/hc/HttpClientFactory.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/http/hc/HttpClientFactory.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/http/hc/SeimiRedirectStrategy.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/http/hc/SeimiRedirectStrategy.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/http/okhttp/CookiesManager.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/http/okhttp/CookiesManager.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/http/okhttp/OkHttpClientBuilderBox.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/http/okhttp/OkHttpClientBuilderBox.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/http/okhttp/OkHttpClientBuilderProvider.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/http/okhttp/OkHttpClientBuilderProvider.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/http/okhttp/OkHttpDownloader.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/http/okhttp/OkHttpDownloader.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/http/okhttp/OkHttpRequestGenerator.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/http/okhttp/OkHttpRequestGenerator.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/httpd/CrawlerStatusHttpProcessor.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/httpd/CrawlerStatusHttpProcessor.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/httpd/HttpRequestProcessor.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/httpd/HttpRequestProcessor.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/httpd/PushRequestHttpProcessor.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/httpd/PushRequestHttpProcessor.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/httpd/SeimiHttpHandler.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/httpd/SeimiHttpHandler.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/spring/boot/CrawlerProperties.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/spring/boot/CrawlerProperties.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/spring/boot/SeimiCrawlerAutoConfiguration.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/spring/boot/SeimiCrawlerAutoConfiguration.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/spring/boot/SeimiCrawlerBeanRegistar.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/spring/boot/SeimiCrawlerBeanRegistar.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/spring/common/CrawlerCache.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/spring/common/CrawlerCache.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/spring/common/SeimiCrawlerBaseConfig.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/spring/common/SeimiCrawlerBaseConfig.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/spring/common/SeimiCrawlerBeanPostProcessor.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/spring/common/SeimiCrawlerBeanPostProcessor.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/spring/common/SeimiCrawlerBootstrapListener.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/spring/common/SeimiCrawlerBootstrapListener.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/spring/common/StandaloneCondition.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/spring/common/StandaloneCondition.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/struct/BodyType.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/struct/BodyType.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/struct/CommonObject.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/struct/CommonObject.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/struct/CrawlerModel.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/struct/CrawlerModel.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/struct/Request.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/struct/Request.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/struct/Response.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/struct/Response.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/utils/ClazzUtils.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/utils/ClazzUtils.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/utils/GenericUtils.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/utils/GenericUtils.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/utils/StrFormatUtil.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/utils/StrFormatUtil.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/utils/StructValidator.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/utils/StructValidator.java -------------------------------------------------------------------------------- /seimicrawler/src/main/java/cn/wanghaomiao/seimi/utils/SysEnvUtil.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/java/cn/wanghaomiao/seimi/utils/SysEnvUtil.java -------------------------------------------------------------------------------- /seimicrawler/src/main/resources/META-INF/spring.factories: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/main/resources/META-INF/spring.factories -------------------------------------------------------------------------------- /seimicrawler/src/test/java/cn/wanghaomiao/seimi/utils/StrFormatUtilTest.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/seimicrawler/src/test/java/cn/wanghaomiao/seimi/utils/StrFormatUtilTest.java -------------------------------------------------------------------------------- /spring-boot-example/pom.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/spring-boot-example/pom.xml -------------------------------------------------------------------------------- /spring-boot-example/src/main/java/cn/wanghaomiao/seimi/SeimiCrawlerApplication.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/spring-boot-example/src/main/java/cn/wanghaomiao/seimi/SeimiCrawlerApplication.java -------------------------------------------------------------------------------- /spring-boot-example/src/main/java/cn/wanghaomiao/seimi/controller/IndexController.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/spring-boot-example/src/main/java/cn/wanghaomiao/seimi/controller/IndexController.java -------------------------------------------------------------------------------- /spring-boot-example/src/main/java/cn/wanghaomiao/seimi/crawlers/Basic.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/spring-boot-example/src/main/java/cn/wanghaomiao/seimi/crawlers/Basic.java -------------------------------------------------------------------------------- /spring-boot-example/src/main/java/cn/wanghaomiao/seimi/crawlers/DefaultRedisQueueEG.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/spring-boot-example/src/main/java/cn/wanghaomiao/seimi/crawlers/DefaultRedisQueueEG.java -------------------------------------------------------------------------------- /spring-boot-example/src/main/resources/application.properties: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/spring-boot-example/src/main/resources/application.properties -------------------------------------------------------------------------------- /spring-boot-example/src/main/resources/seimi-app.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/spring-boot-example/src/main/resources/seimi-app.xml -------------------------------------------------------------------------------- /standalone-example/pom.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/standalone-example/pom.xml -------------------------------------------------------------------------------- /standalone-example/src/main/java/cn/wanghaomiao/annotations/DoLog.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/standalone-example/src/main/java/cn/wanghaomiao/annotations/DoLog.java -------------------------------------------------------------------------------- /standalone-example/src/main/java/cn/wanghaomiao/crawlers/Basic.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/standalone-example/src/main/java/cn/wanghaomiao/crawlers/Basic.java -------------------------------------------------------------------------------- /standalone-example/src/main/java/cn/wanghaomiao/crawlers/BasicWithScheduler.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/standalone-example/src/main/java/cn/wanghaomiao/crawlers/BasicWithScheduler.java -------------------------------------------------------------------------------- /standalone-example/src/main/java/cn/wanghaomiao/crawlers/DatabaseMybatisDemo.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/standalone-example/src/main/java/cn/wanghaomiao/crawlers/DatabaseMybatisDemo.java -------------------------------------------------------------------------------- /standalone-example/src/main/java/cn/wanghaomiao/crawlers/DefaultRedisQueueEG.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/standalone-example/src/main/java/cn/wanghaomiao/crawlers/DefaultRedisQueueEG.java -------------------------------------------------------------------------------- /standalone-example/src/main/java/cn/wanghaomiao/crawlers/DynamicUserAgent.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/standalone-example/src/main/java/cn/wanghaomiao/crawlers/DynamicUserAgent.java -------------------------------------------------------------------------------- /standalone-example/src/main/java/cn/wanghaomiao/crawlers/IntercepterDemo.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/standalone-example/src/main/java/cn/wanghaomiao/crawlers/IntercepterDemo.java -------------------------------------------------------------------------------- /standalone-example/src/main/java/cn/wanghaomiao/crawlers/JDWalker.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/standalone-example/src/main/java/cn/wanghaomiao/crawlers/JDWalker.java -------------------------------------------------------------------------------- /standalone-example/src/main/java/cn/wanghaomiao/crawlers/MutiPageNewsCrawler.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/standalone-example/src/main/java/cn/wanghaomiao/crawlers/MutiPageNewsCrawler.java -------------------------------------------------------------------------------- /standalone-example/src/main/java/cn/wanghaomiao/crawlers/SeimiAgentDemo.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/standalone-example/src/main/java/cn/wanghaomiao/crawlers/SeimiAgentDemo.java -------------------------------------------------------------------------------- /standalone-example/src/main/java/cn/wanghaomiao/crawlers/StoreInFile.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/standalone-example/src/main/java/cn/wanghaomiao/crawlers/StoreInFile.java -------------------------------------------------------------------------------- /standalone-example/src/main/java/cn/wanghaomiao/crawlers/UseBeanResolver.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/standalone-example/src/main/java/cn/wanghaomiao/crawlers/UseBeanResolver.java -------------------------------------------------------------------------------- /standalone-example/src/main/java/cn/wanghaomiao/crawlers/UseCookie.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/standalone-example/src/main/java/cn/wanghaomiao/crawlers/UseCookie.java -------------------------------------------------------------------------------- /standalone-example/src/main/java/cn/wanghaomiao/crawlers/UseDelay.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/standalone-example/src/main/java/cn/wanghaomiao/crawlers/UseDelay.java -------------------------------------------------------------------------------- /standalone-example/src/main/java/cn/wanghaomiao/crawlers/UseDynamicProxy.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/standalone-example/src/main/java/cn/wanghaomiao/crawlers/UseDynamicProxy.java -------------------------------------------------------------------------------- /standalone-example/src/main/java/cn/wanghaomiao/crawlers/UseProxy.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/standalone-example/src/main/java/cn/wanghaomiao/crawlers/UseProxy.java -------------------------------------------------------------------------------- /standalone-example/src/main/java/cn/wanghaomiao/dao/mybatis/MybatisStoreDAO.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/standalone-example/src/main/java/cn/wanghaomiao/dao/mybatis/MybatisStoreDAO.java -------------------------------------------------------------------------------- /standalone-example/src/main/java/cn/wanghaomiao/interceptors/DemoInterceptor.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/standalone-example/src/main/java/cn/wanghaomiao/interceptors/DemoInterceptor.java -------------------------------------------------------------------------------- /standalone-example/src/main/java/cn/wanghaomiao/main/Boot.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/standalone-example/src/main/java/cn/wanghaomiao/main/Boot.java -------------------------------------------------------------------------------- /standalone-example/src/main/java/cn/wanghaomiao/main/StartWorkers.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/standalone-example/src/main/java/cn/wanghaomiao/main/StartWorkers.java -------------------------------------------------------------------------------- /standalone-example/src/main/java/cn/wanghaomiao/model/BlogContent.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/standalone-example/src/main/java/cn/wanghaomiao/model/BlogContent.java -------------------------------------------------------------------------------- /standalone-example/src/main/resources/config/db_demo.sql: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/standalone-example/src/main/resources/config/db_demo.sql -------------------------------------------------------------------------------- /standalone-example/src/main/resources/config/seimi.properties: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/standalone-example/src/main/resources/config/seimi.properties -------------------------------------------------------------------------------- /standalone-example/src/main/resources/logback.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/standalone-example/src/main/resources/logback.xml -------------------------------------------------------------------------------- /standalone-example/src/main/resources/mybatis-config.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/standalone-example/src/main/resources/mybatis-config.xml -------------------------------------------------------------------------------- /standalone-example/src/main/resources/seimi-mybatis.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/standalone-example/src/main/resources/seimi-mybatis.xml -------------------------------------------------------------------------------- /standalone-example/src/main/resources/seimi.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/standalone-example/src/main/resources/seimi.xml -------------------------------------------------------------------------------- /standalone-example/src/test/java/cn/wanghaomiao/main/RunTest.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhegexiaohuozi/SeimiCrawler/HEAD/standalone-example/src/test/java/cn/wanghaomiao/main/RunTest.java --------------------------------------------------------------------------------