├── images ├── webui.png ├── yara-output.png ├── architecture.png ├── clamav-output.png ├── external_intel.png ├── misp-overview.png ├── payload-output.png ├── sqlite-storage.png ├── console-storage.png └── architecture-prev.png ├── crawler ├── utils │ ├── subcrawl.db │ ├── ansi_colors.py │ ├── __init__.py │ ├── logos │ │ ├── subcrawl-2.txt │ │ ├── subcrawl-3.txt │ │ └── subcrawl-1.txt │ ├── setup_kafka_topic.py │ ├── banner.py │ ├── helpers.py │ ├── sqlite_model.py │ └── logger.py ├── processing │ ├── minisdhash │ │ ├── sdhash │ │ ├── libsdbf.a │ │ └── sdbf_class.py │ ├── default_processing.py │ ├── example_processing.py │ ├── __init__.py │ ├── tlsh_processing.py │ ├── jarm_processing.py │ ├── yara_processing.py │ ├── clamav_processing.py │ ├── sdhash_processing.py │ ├── payload_processing.py │ └── external_intel_processing.py ├── run.sh ├── storage │ ├── __init__.py │ ├── default_storage.py │ ├── example_storage.py │ ├── console_storage.py │ ├── sqlite_storage.py │ ├── elastic_storage.py │ ├── misp_storage.py │ └── kibana-dashboard │ │ └── overview-dashboard.ndjson ├── yara-rules │ ├── open_webshell.yar │ ├── php_file_manager_login.yar │ ├── erbium_discord_panel_login.yar │ ├── default_page_xampp_windows.yar │ ├── default_page_apache.yar │ ├── outlook_phish.yar │ ├── titan_stealer_panel_login.yar │ ├── royalmail_phish.yar │ ├── sharepoint_online_phish.yar │ ├── chase_login_spox_phish.yar │ ├── collector_stealer_panel_login.yar │ ├── bapr_banking_phish.yar │ ├── hex-encoded-pe-file.yar │ ├── microsoft_phish.yar │ ├── aurora_stealer_panel_login.yar │ ├── modernloader_panel_login.yar │ ├── office365_review_phish.yar │ ├── webpanel_origin_login.yar │ ├── base64_pe.yar │ ├── amadey_panel_login.yar │ ├── office365_verify_pdf_phish.yar │ ├── wellsfargo_phish.yar │ ├── bankamerica_phish.yar │ ├── link_sharing_onedrive.yar │ ├── pony_panel_login.yar │ ├── attachments_onedrive_phish.yar │ ├── microsoft_login_phish.yar │ ├── unam_webpanel_login.yar │ ├── sharepoint_dropbox_online_phish.yar │ ├── standard_bank_phish.yar │ ├── onedrive_business_phish.yar │ ├── panels.yar │ ├── h3k_tinyfilemanager_login.yar │ ├── grandamisha_panel_login.yar │ ├── wallet_connect_phish.yar │ ├── obfuscated_script.yar │ ├── acridrain_stealer_panel_login.yar │ ├── mars_panel_login.yar │ ├── huntington_phish.yar │ ├── mana5_panel_login.yar │ ├── base64_shellcode_dos_header_pe.yar │ ├── html_webshell_login.yar │ ├── php_webshell_backend.yar │ ├── agenttesla_webpanel_login.yar │ ├── js_webshell_tracking_script.yar │ └── combined-rules.yar ├── requirements.txt ├── Dockerfile ├── docker-compose.yml ├── app │ ├── templates │ │ ├── domains.html │ │ ├── urls.html │ │ ├── search_results.html │ │ ├── dashboard.html │ │ ├── url_details.html │ │ ├── domain_details.html │ │ └── base.html │ └── main.py ├── service.py ├── input │ ├── phishtank.py │ └── urlhaus.py ├── misp-objects │ └── opendir-url │ │ └── definition.json ├── supervisor │ └── supervisord.conf ├── config.yml └── subcrawl.py ├── conferences └── 2021 │ └── blackhat_us_arsenal │ └── BH-Arsenal-2021.pdf ├── License.md ├── .gitignore └── README.md /images/webui.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jstrosch/subcrawl/HEAD/images/webui.png -------------------------------------------------------------------------------- /images/yara-output.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jstrosch/subcrawl/HEAD/images/yara-output.png -------------------------------------------------------------------------------- /crawler/utils/subcrawl.db: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jstrosch/subcrawl/HEAD/crawler/utils/subcrawl.db -------------------------------------------------------------------------------- /images/architecture.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jstrosch/subcrawl/HEAD/images/architecture.png -------------------------------------------------------------------------------- /images/clamav-output.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jstrosch/subcrawl/HEAD/images/clamav-output.png -------------------------------------------------------------------------------- /images/external_intel.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jstrosch/subcrawl/HEAD/images/external_intel.png -------------------------------------------------------------------------------- /images/misp-overview.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jstrosch/subcrawl/HEAD/images/misp-overview.png -------------------------------------------------------------------------------- /images/payload-output.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jstrosch/subcrawl/HEAD/images/payload-output.png -------------------------------------------------------------------------------- /images/sqlite-storage.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jstrosch/subcrawl/HEAD/images/sqlite-storage.png -------------------------------------------------------------------------------- /images/console-storage.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jstrosch/subcrawl/HEAD/images/console-storage.png -------------------------------------------------------------------------------- /images/architecture-prev.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jstrosch/subcrawl/HEAD/images/architecture-prev.png -------------------------------------------------------------------------------- /crawler/processing/minisdhash/sdhash: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jstrosch/subcrawl/HEAD/crawler/processing/minisdhash/sdhash -------------------------------------------------------------------------------- /crawler/processing/minisdhash/libsdbf.a: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jstrosch/subcrawl/HEAD/crawler/processing/minisdhash/libsdbf.a -------------------------------------------------------------------------------- /crawler/run.sh: -------------------------------------------------------------------------------- 1 | service clamav-daemon start 2 | service supervisor start 3 | gunicorn app.main:app -b 0.0.0.0:8000 --reload --workers 4 -------------------------------------------------------------------------------- /conferences/2021/blackhat_us_arsenal/BH-Arsenal-2021.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jstrosch/subcrawl/HEAD/conferences/2021/blackhat_us_arsenal/BH-Arsenal-2021.pdf -------------------------------------------------------------------------------- /crawler/storage/__init__.py: -------------------------------------------------------------------------------- 1 | # © Copyright 2021 HP Development Company, L.P. 2 | from .console_storage import ConsoleStorage 3 | from .misp_storage import MISPStorage 4 | from .sqlite_storage import SqliteStorage 5 | from .elastic_storage import ElasticStorage 6 | -------------------------------------------------------------------------------- /crawler/utils/ansi_colors.py: -------------------------------------------------------------------------------- 1 | # © Copyright 2021 HP Development Company, L.P. 2 | 3 | class SubCrawlColors: 4 | BLUE = '\033[34m' 5 | GREEN = '\033[32m' 6 | PURPLE = '\033[35m' 7 | YELLOW = '\033[33m' 8 | RED = '\033[31m' 9 | CYAN = '\033[36m' 10 | RESET = '\033[0m' 11 | CLS = '\033[2J' 12 | -------------------------------------------------------------------------------- /crawler/yara-rules/open_webshell.yar: -------------------------------------------------------------------------------- 1 | rule open_webshell 2 | { 3 | meta: 4 | description = "Open Webshell Detection" 5 | author = "patrick.schlapfer@hp.com" 6 | date = "2021-04-19" 7 | 8 | strings: 9 | $a = "file manager" 10 | $b = "uname" 11 | 12 | condition: 13 | all of them 14 | } 15 | -------------------------------------------------------------------------------- /crawler/yara-rules/php_file_manager_login.yar: -------------------------------------------------------------------------------- 1 | rule php_file_manager_login { 2 | 3 | meta: 4 | date = "2022-11-29" 5 | 6 | strings: 7 | $s1 = "