├── .gitignore
├── LICENSE
├── README.md
├── firmanalyzer
    ├── CVEsearch.py
    ├── Examples
    │   ├── buffalo
    │   │   ├── explore.log
    │   │   ├── report.txt
    │   │   └── summary.txt
    │   ├── dap-3662.log
    │   ├── dlink
    │   │   ├── DAP-2690_REVB_FIRMWARE_3.16.RC100_WW
    │   │   │   ├── report.txt
    │   │   │   └── summary.txt
    │   │   └── DAP-3662
    │   │   │   ├── dap-3662.log
    │   │   │   ├── report.txt
    │   │   │   ├── summary.txt
    │   │   │   └── token_usage.jsonl
    │   ├── explore.log
    │   ├── mikrotik
    │   │   ├── routeros-7.5-mipsbe
    │   │   │   ├── report.txt
    │   │   │   ├── summary.txt
    │   │   │   └── token_usage.jsonl
    │   │   └── routeros-x86-6.49.6
    │   │   │   ├── report.txt
    │   │   │   ├── summary.txt
    │   │   │   └── token_usage.jsonl
    │   ├── openwrt
    │   │   ├── fbecd0858ac36049e04bf9dd8acd3dd53fed97b4
    │   │   │   ├── report.txt
    │   │   │   ├── summary.txt
    │   │   │   └── token_usage.jsonl
    │   │   └── openwrtSample
    │   │   │   ├── report.txt
    │   │   │   └── summary.txt
    │   ├── summary_example.md
    │   ├── tp-link
    │   │   └── TL-IPC55x_P_-x_2.0
    │   │   │   ├── report.txt
    │   │   │   └── summary.txt
    │   └── ui
    │   │   ├── Ubiquiti 4.3.22.11330
    │   │       ├── report.txt
    │   │       └── summary.txt
    │   │   └── Ubiquiti Linux-2.6.32.71
    │   │       ├── report.txt
    │   │       └── summary
    ├── LogManage.py
    ├── R2decetor.py
    ├── README.md
    ├── analyze.py
    ├── callback.py
    ├── client.py
    ├── disassembly.py
    ├── explore.py
    ├── llm_config.py
    ├── requirements.yaml
    ├── run.py
    ├── securityscan.py
    ├── tools.py
    └── utils.py
└── firmcrawler
    ├── Examples
        ├── dlink
        │   ├── navigation_links.jsonl
        │   ├── screenshot_1.png
        │   ├── screenshot_2.png
        │   ├── screenshot_3.png
        │   ├── screenshot_4.png
        │   └── screenshot_5.png
        ├── openwrt
        │   ├── screenshot_1.png
        │   ├── screenshot_2.png
        │   ├── screenshot_3.png
        │   ├── screenshot_4.png
        │   └── screenshot_5.png
        ├── tp-link
        │   ├── navigation_links.jsonl
        │   ├── screenshot_1.png
        │   ├── screenshot_2.png
        │   ├── screenshot_3.png
        │   ├── screenshot_4.png
        │   └── screenshot_5.png
        ├── ui
        │   ├── navigation_links.jsonl
        │   ├── screenshot_1.png
        │   ├── screenshot_2.png
        │   ├── screenshot_3.png
        │   ├── screenshot_4.png
        │   └── screenshot_5.png
        └── zyxel
        │   ├── navigation_links.jsonl
        │   ├── screenshot_1.png
        │   ├── screenshot_2.png
        │   ├── screenshot_3.png
        │   ├── screenshot_4.png
        │   └── screenshot_5.png
    ├── README.md
    ├── callback.py
    ├── crawler.py
    ├── mark_page.js
    ├── prompts
        ├── base.yaml
        ├── dlink.yaml
        ├── foscam.yaml
        └── ui.yaml
    ├── run.py
    └── web_intrect.py


/.gitignore:
--------------------------------------------------------------------------------
1 | *.ini
2 | __pycache__/
3 | *.py[cod]
4 | *$py.class
5 | firmanalyzer/result/
6 | .idea/
7 | 


--------------------------------------------------------------------------------
/LICENSE:
--------------------------------------------------------------------------------
  1 |                                  Apache License
  2 |                            Version 2.0, January 2004
  3 |                         http://www.apache.org/licenses/
  4 | 
  5 |    TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
  6 | 
  7 |    1. Definitions.
  8 | 
  9 |       "License" shall mean the terms and conditions for use, reproduction,
 10 |       and distribution as defined by Sections 1 through 10 of this document.
 11 | 
 12 |       "Licensor" shall mean the copyright owner or entity authorized by
 13 |       the copyright owner that is granting the License.
 14 | 
 15 |       "Legal Entity" shall mean the union of the acting entity and all
 16 |       other entities that control, are controlled by, or are under common
 17 |       control with that entity. For the purposes of this definition,
 18 |       "control" means (i) the power, direct or indirect, to cause the
 19 |       direction or management of such entity, whether by contract or
 20 |       otherwise, or (ii) ownership of fifty percent (50%) or more of the
 21 |       outstanding shares, or (iii) beneficial ownership of such entity.
 22 | 
 23 |       "You" (or "Your") shall mean an individual or Legal Entity
 24 |       exercising permissions granted by this License.
 25 | 
 26 |       "Source" form shall mean the preferred form for making modifications,
 27 |       including but not limited to software source code, documentation
 28 |       source, and configuration files.
 29 | 
 30 |       "Object" form shall mean any form resulting from mechanical
 31 |       transformation or translation of a Source form, including but
 32 |       not limited to compiled object code, generated documentation,
 33 |       and conversions to other media types.
 34 | 
 35 |       "Work" shall mean the work of authorship, whether in Source or
 36 |       Object form, made available under the License, as indicated by a
 37 |       copyright notice that is included in or attached to the work
 38 |       (an example is provided in the Appendix below).
 39 | 
 40 |       "Derivative Works" shall mean any work, whether in Source or Object
 41 |       form, that is based on (or derived from) the Work and for which the
 42 |       editorial revisions, annotations, elaborations, or other modifications
 43 |       represent, as a whole, an original work of authorship. For the purposes
 44 |       of this License, Derivative Works shall not include works that remain
 45 |       separable from, or merely link (or bind by name) to the interfaces of,
 46 |       the Work and Derivative Works thereof.
 47 | 
 48 |       "Contribution" shall mean any work of authorship, including
 49 |       the original version of the Work and any modifications or additions
 50 |       to that Work or Derivative Works thereof, that is intentionally
 51 |       submitted to Licensor for inclusion in the Work by the copyright owner
 52 |       or by an individual or Legal Entity authorized to submit on behalf of
 53 |       the copyright owner.
 54 | 
 55 |       "Contributor" shall mean Licensor and any individual or Legal Entity
 56 |       on behalf of whom a Contribution has been received by Licensor and
 57 |       subsequently incorporated within the Work.
 58 | 
 59 |    2. Grant of Copyright License...
 60 | 
 61 |    3. Grant of Patent License...
 62 | 
 63 |    4. Redistribution...
 64 | 
 65 |    5. Submission of Contributions...
 66 | 
 67 |    6. Trademarks...
 68 | 
 69 |    7. Disclaimer of Warranty...
 70 | 
 71 |    8. Limitation of Liability...
 72 | 
 73 |    9. Accepting Warranty or Additional Liability...
 74 | 
 75 |    10. Additional Terms by Licensor Zhang Xiangrui:
 76 | 
 77 |        a) The Work and Derivative Works may be used for **academic and
 78 |           non-commercial research purposes only**.
 79 | 
 80 |        b) Any form of **commercial use** (including but not limited to:
 81 |           integration into commercial products, providing commercial
 82 |           services, SaaS platforms, or generating revenue through the
 83 |           Work or Derivative Works) is **prohibited without explicit,
 84 |           written permission** from the Licensor.
 85 | 
 86 |        c) If You produce academic papers, tools, or software based on or
 87 |           using the Work or its Derivative Works, **you must also release
 88 |           those related codes under an open-source license** that is
 89 |           compatible with the Apache License, Version 2.0.
 90 | 
 91 |        d) You must properly attribute the original author(s) in any public
 92 |           or published work that uses or builds upon this Work.
 93 | 
 94 |    END OF TERMS AND CONDITIONS
 95 | 
 96 |    APPENDIX: How to apply the Apache License to your work.
 97 | 
 98 |       To apply the Apache License to your work, attach the following
 99 |       boilerplate notice, with the fields enclosed by brackets "[]"
100 |       replaced with your own identifying information.
101 | 
102 |    Copyright 2025 Zhang Xiangrui
103 | 
104 |    Licensed under the Apache License, Version 2.0 (the "License");
105 |    you may not use this file except in compliance with the License.
106 |    You may obtain a copy of the License at
107 | 
108 |        http://www.apache.org/licenses/LICENSE-2.0
109 | 
110 |    Unless required by applicable law or agreed to in writing, software
111 |    distributed under the License is distributed on an "AS IS" BASIS,
112 |    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
113 |    See the License for the specific language governing permissions and
114 |    limitations under the License.
115 | 
116 |    Additional Restrictions:
117 |    - For academic use only.
118 |    - Commercial use is prohibited without permission.
119 |    - Research results based on this code must also be open-sourced.
120 | 


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
  1 | # FirmLLM
  2 | 
  3 | A Multi-Agent System for Large-Scale Firmware Collection and Analysis Based on Large Language Models
  4 | 
  5 | FirmLLM is designed to **automate long-cycle analysis tasks** by leveraging multi-agent collaboration and LLMs, enabling scalable and intelligent firmware collection and vulnerability analysis.  It aims to **reduce the manual burden on security analysts** by streamlining and accelerating complex firmware security workflows.
  6 | 
  7 | ---
  8 | 
  9 | ## Overview
 10 | 
 11 | **FirmLLM** is an integrated system for large-scale firmware acquisition and security analysis. It leverages multi-agent collaboration and large language models (LLMs) to achieve intelligent automation in both crawling and analysis.
 12 | 
 13 | The system consists of two main modules:
 14 | 
 15 | - **FirmCrawler**: A multi-agent web crawler for automated firmware collection from online sources
 16 | - **FirmAnalyzer**: A firmware security analysis engine that combines static tools and LLM capabilities
 17 | 
 18 | ---
 19 | 
 20 | ## 📁 Project Structure
 21 | 
 22 | ```
 23 | .
 24 | ├── firmcrawler/       # Firmware Collection System
 25 | └── firmanalyzer/      # Firmware Analysis System
 26 |     └── Examples/      # Analysis Result Samples
 27 | ```
 28 | 
 29 | ---
 30 | 
 31 | ## 🕸️ Firmware Collection System (FirmCrawler)
 32 | 
 33 | **FirmCrawler** is used for automated collection of firmware files from various manufacturers. The system is built upon and optimized from [WebVoyager](https://langchain-ai.github.io/langgraph/tutorials/web-navigation/web_voyager/) [[paper]](https://arxiv.org/abs/2401.13919), implementing a multi-agent collaboration system for large-scale firmware collection. 
 34 | WebVoyager is an innovative Large Multimodal Model (LMM) powered web agent that can complete user instructions end-to-end by interacting with real-world websites.
 35 | 
 36 | ### 🔧 Key Features
 37 | 
 38 | - Autonomous interaction with vendor sites  
 39 | - Intelligent firmware file identification and retrieval  
 40 | - Multi-agent concurrent crawling  
 41 | - Distributed task scheduling
 42 | 
 43 | ### 📄 Core Files
 44 | 
 45 | - `crawler.py`: Core crawler logic  
 46 | - `web_intrect.py`: Web interaction controller  
 47 | - `mark_page.js`: Web element tagging script  
 48 | - `prompts/*.yaml`: Vendor-specific prompt configurations for the LLM (e.g. `base.yaml`, `dlink.yaml`)
 49 | 
 50 | ---
 51 | 
 52 | ## 🔍 Firmware Analysis System (FirmAnalyzer)
 53 | 
 54 | FirmAnalyzer aims to **mimic human-like reasoning when analyzing firmware behavior**, leveraging the semantic understanding and code interpretation capabilities of LLMs to autonomously **prioritize, interpret, and investigate potential security issues**.  
 55 | This design helps **alleviate the heavy workload typically required from security professionals** in manual firmware auditing.
 56 | 
 57 | 
 58 | ### 🛠️ Key Capabilities
 59 | 
 60 | - Firmware unpacking and filesystem detection  
 61 | - Static and semantic vulnerability detection  
 62 | - Binary disassembly and logic analysis  
 63 | - CVE correlation and risk scoring  
 64 | - Human-readable reports powered by LLMs
 65 | 
 66 | ### 📄 Core Files
 67 | 
 68 | - `run.py`: Entry point for analysis  
 69 | - `explore.py`: Filesystem exploration and metadata gathering  
 70 | - `analyze.py`: Firmware file analysis module  
 71 |   - **Sensitive Info Pattern Matching**: Regex and semantic pattern detection (preliminary filtering to guide LLM inspection and direction)  
 72 |   - **Shell Command Executor**: Executes Linux tools such as `cat`, `grep`, etc.  
 73 |   - **CVE Query Tool**: Queries vulnerability data through APIs  
 74 |   - **Disassembly Assistant**: Integrates `radare2` with LLM for binary reasoning  
 75 | - `requirements.yaml`: A user-configurable file that defines the overall analysis plan. It allows users to customize:
 76 |   - The **scope of analysis** and specific **target components**  
 77 |   - **Directory scanning priorities** (e.g., focus on `/etc`, `/bin`, or `/www`)  
 78 |   - **Security analysis strategies**, such as whether to perform code-level audits or pattern-based detections  
 79 |   - **Risk severity classification rules** to define what constitutes high/medium/low severity  
 80 |   - The **format and structure** of generated **reports and summaries**
 81 | ---
 82 | 
 83 | ## 📊 Example Outputs (Examples)
 84 | 
 85 | Contains complete logs and reports from analyzing firmware using **DeepSeek-v3** and **DeepSeek-r1** models.
 86 | 
 87 | ### 📝 Files
 88 | 
 89 | - `explore.log`: Full exploration log  
 90 | - `report.txt`: File-by-file security analysis  
 91 | - `summary.txt`: Overall security summary and risk level
 92 | 
 93 | ### 🤖 Model Performance Notes
 94 | 
 95 | We primarily use **DeepSeek-v3** and **DeepSeek-r1** for firmware analysis.  
 96 | In addition, **Claude-Sonnet-3.7** may demonstrate promising performance in code auditing tasks, especially for semantic reasoning and cross-file logic analysis.
 97 | DeepSeek offers lower costs, but we are actively experimenting and comparing results across multiple models to find the optimal configuration.
 98 | 
 99 | ---
100 | 
101 | ## ⚠️ Limitations and Challenges
102 | 
103 | ### Format & Semantic Limitations
104 | 
105 | - Inability to automatically decrypt or handle proprietary firmware formats  
106 | - LLMs may hallucinate when analyzing complex control flows  
107 | - Limited understanding of intricate build scripts and service configurations
108 | ---
109 | 
110 | ## 🚧 Roadmap
111 | 
112 | Upcoming work will focus on:
113 | 
114 | - **Integrating more static analysis tools**, especially for binary-focused workflows to improve analysis coverage and accuracy  
115 | - **Combining symbolic execution with LLMs** to enhance deep vulnerability discovery and validation  
116 | - **Exploring firmware runtime state analysis** (e.g., process behavior, service call graphs, and system responses) to prioritize high-risk issues
117 | 
118 | ---
119 | 
120 | ## 📌 Notes & Compliance
121 | 
122 | 1. All results are for **research purposes only**  
123 | 2. Please ensure legal and ethical use of the system  
124 | 3. Verification should be performed in sandboxed/test environments  
125 | 4. We are actively engaging with vendors to confirm findings and, under compliant conditions, release more security reports
126 | 
127 | ---
128 | 


--------------------------------------------------------------------------------
/firmanalyzer/CVEsearch.py:
--------------------------------------------------------------------------------
  1 | import os 
  2 | import re
  3 | import requests
  4 | import json
  5 | import time
  6 | from bs4 import BeautifulSoup  # Add BeautifulSoup for parsing HTML
  7 | from typing import List, Dict, Any
  8 | from client import create_openai_client
  9 | 
 10 | def parse_openai_response(response_text: str) -> List[Dict[str, str]]:
 11 |     """
 12 |     从LLM响应中提取并验证JSON数据
 13 |     返回结构示例：[{"cve_id": "CVE-XXXX-XXXX", "description": "..."}]
 14 |     """
 15 |     # 匹配JSON数组模式（支持多行）
 16 |     json_pattern = r'\[\s*\{.*?\}\s*\]'
 17 |     matches = re.finditer(json_pattern, response_text, re.DOTALL)
 18 |     
 19 |     valid_entries = []
 20 |     
 21 |     for match in matches:
 22 |         try:
 23 |             # 尝试解析JSON
 24 |             json_str = match.group()
 25 |             parsed = json.loads(json_str)
 26 |             
 27 |             # 验证数据结构
 28 |             if isinstance(parsed, list):
 29 |                 for entry in parsed:
 30 |                     if all(key in entry for key in ('cve_id', 'description')):
 31 |                         # 基础字段验证
 32 |                         valid_entry = {
 33 |                             'cve_id': str(entry['cve_id']).strip(),
 34 |                             'description': str(entry['description']).strip()
 35 |                         }
 36 |                         # 可选添加额外验证（如CVE ID格式）
 37 |                         if valid_entry['cve_id'].startswith('CVE-'):
 38 |                             valid_entries.append(valid_entry)
 39 |                         else:
 40 |                             print(f"Invalid CVE ID format: {valid_entry['cve_id']}")
 41 |             else:
 42 |                 print(f"Expected JSON array, got {type(parsed)}")
 43 |                 
 44 |         except json.JSONDecodeError as e:
 45 |             print(f"JSON解析失败: {str(e)}")
 46 |             print(f"Problematic JSON: {json_str}")
 47 |             
 48 |     return valid_entries
 49 | def parse_component_and_version(component: str) -> tuple:
 50 |     """使用正则表达式匹配版本号"""
 51 |     version_pattern = r"\b(v?\d+\.\d+[\w.]*)\b"
 52 |     match = re.search(version_pattern, component)
 53 |     if match:
 54 |         version = match.group(1)
 55 |         name = component.replace(version, "").strip()
 56 |         return name, version
 57 |     return component, ""
 58 | 
 59 | def parse_mitre_html(html_content, component_name, version):
 60 |     """Parse MITRE HTML response to extract CVE information"""
 61 |     soup = BeautifulSoup(html_content, 'html.parser')
 62 |     cve_items = []
 63 |     
 64 |     # Find tables (not dependent on specific ID)
 65 |     tables = soup.find_all('table')
 66 |     
 67 |     for table in tables:
 68 |         rows = table.find_all('tr')
 69 |         for row in rows:
 70 |             cells = row.find_all('td')
 71 |             if len(cells) >= 2:  # Ensure at least two columns
 72 |                 cve_cell = cells[0]
 73 |                 desc_cell = cells[1]
 74 |                 
 75 |                 # Find CVE ID
 76 |                 cve_link = cve_cell.find('a')
 77 |                 if cve_link and 'CVE-' in cve_link.text:
 78 |                     cve_id = cve_link.text.strip()
 79 |                     desc_text = desc_cell.text.strip()
 80 |                     
 81 |                     # Check if description contains component name (case insensitive)
 82 |                     if component_name.lower() in desc_text.lower():
 83 |                         cve_item = {
 84 |                             'cve_id': cve_id,
 85 |                             'description': desc_text,
 86 |                             'source': 'MITRE'
 87 |                         }
 88 |                         cve_items.append(cve_item)
 89 |     
 90 |     print(f"Found {len(cve_items)} related CVEs from MITRE")
 91 |     return cve_items
 92 | 
 93 | def analyze_cve_with_openai(component_name: str, version: str, search_results: Dict[str, Any]) -> List[str]:
 94 |     """Analyze CVE results using OpenAI, supporting batch processing"""
 95 |     # Extract all CVE entries from search results
 96 |     all_cves = []
 97 |     if search_results.get("mitre"):
 98 |         all_cves.extend(search_results["mitre"])
 99 |     
100 |     # Batch size
101 |     BATCH_SIZE = 15
102 |     analyzed_results = []
103 |     
104 |     # Process CVEs in batches
105 |     for i in range(0, len(all_cves), BATCH_SIZE):
106 |         batch = all_cves[i:i + BATCH_SIZE]
107 |         batch_num = i//BATCH_SIZE + 1
108 |         
109 |         # Prepare prompt
110 |         prompt = f"""
111 | Target Component: {component_name}{version}
112 | 
113 | Please analyze the following {len(batch)} CVEs to determine if they affect this version. Do not make extra inferences.
114 | {json.dumps(batch, indent=2)}
115 | 
116 | **Version Analysis Rules**:
117 | When analyzing CVEs:
118 |    - Only include CVEs where the vulnerable version range INCLUDES the component version
119 |    For example, if the component version is 1.01, and the CVE description mentions version through v1.02, it should be included.
120 | 
121 | Please return all matching CVEs in JSON format, otherwise return an empty list. Do not include any other content. Format as follows:
122 | '''
123 | [
124 |     {{
125 |         "cve_id": "CVE-ID",
126 |         "description": "Vulnerability description",
127 |     }}
128 | ]
129 | '''
130 | 
131 | """
132 |         print(prompt)
133 |         try:
134 |             # Call OpenAI API
135 |             model,client = create_openai_client()
136 |             response = client.chat.completions.create(
137 |                 model=model,
138 |                 messages=[
139 |                     {"role": "system", "content": "You are a security expert specializing in analyzing CVE vulnerability information to confirm which CVEs affect the target component."},
140 |                     {"role": "user", "content": prompt}
141 |                 ],
142 |                 temperature=0
143 |             )
144 |             # Get response text
145 |             if response.choices and response.choices[0].message:
146 |                 result_text = response.choices[0].message.content
147 |                 print(f"\n=== Batch {batch_num} Analysis Results ===")
148 |                 parsed_data = parse_openai_response(result_text)
149 |                 analyzed_results.extend(parsed_data)
150 |                 print(parsed_data)
151 |                 print(f"Analyzed {len(analyzed_results) * BATCH_SIZE}/{len(all_cves)} CVEs")
152 |             
153 |             # Add delay to avoid rate limits
154 |             time.sleep(1)
155 |             
156 |         except Exception as e:
157 |             print(f"Error processing batch {batch_num}: {e}")
158 |             continue
159 |     
160 |     print("\n=== Merging Analysis Results ===")
161 |     print(json.dumps(analyzed_results, indent=2, ensure_ascii=False))  # 修改这里
162 |     
163 |     return analyzed_results
164 | 
def query_nvd_and_mitre(component: str, save_path: str = None):
    """
    Query CVE information for a component and filter it with the LLM.

    Despite the name, only the MITRE keyword search is queried here. The
    hits are sorted newest first, capped at 100 and passed to
    ``analyze_cve_with_openai``.

    :param component: Component name, e.g. "BusyBox 1.01" or "BusyBox v1.01"
    :param save_path: Optional directory; when given, the analyzed results
                      are appended to ``<save_path>/cve_search.txt`` as JSON.
    :return: {"raw_results": {...}, "analyzed_results": [...]}
    """
    # Parse component name and version
    component_name, version = parse_component_and_version(component)

    try:
        print(f"\nQuerying MITRE: {component}")
        # Pass the keyword via params so it is URL-encoded, and bound the
        # wait so an unresponsive server cannot block the analysis forever.
        mitre_response = requests.get(
            "https://cve.mitre.org/cgi-bin/cvekey.cgi",
            params={"keyword": component},
            timeout=30,
        )

        if mitre_response.status_code == 200:
            mitre_results = parse_mitre_html(mitre_response.text, component_name, version)
        else:
            print(f"MITRE returned error status code: {mitre_response.status_code}")
            mitre_results = None

    except Exception as e:
        print(f"MITRE query error: {e}")
        mitre_results = None

    # Integrate results
    results = {
        "mitre": mitre_results,
        "component": component_name,
        "version": version
    }

    def _cve_sort_key(item):
        # Compare (year, sequence) numerically; a plain string sort would put
        # CVE-2021-9999 above CVE-2021-10000.
        id_match = re.match(r"CVE-(\d+)-(\d+)", str(item['cve_id']))
        if id_match:
            return (int(id_match.group(1)), int(id_match.group(2)))
        return (0, 0)

    # Sort and limit results before analysis
    if results["mitre"]:
        # Sort CVEs by ID in descending order (newest first)
        sorted_cves = sorted(results["mitre"], key=_cve_sort_key, reverse=True)

        results["mitre"] = sorted_cves[:100]
        print(f"Limited to newest 100 CVEs from {len(sorted_cves)} total CVEs")

    # Analyze results using OpenAI
    analyzed_results = analyze_cve_with_openai(component_name, version, results)

    # Save results if save_path provided
    if save_path:
        try:
            os.makedirs(save_path, exist_ok=True)
            output_file = os.path.join(save_path, "cve_search.txt")
            with open(output_file, 'a', encoding="utf-8") as f:
                save_data = {
                    "analyzed_results": analyzed_results
                }
                json.dump(save_data, f, indent=2)
                # The file is opened in append mode; separate records so
                # consecutive runs do not fuse into one unreadable blob.
                f.write("\n")
            print(f"Results saved to {output_file}")
        except Exception as e:
            print(f"Error saving results to file: {e}")

    # The summary is printed whether or not results were saved.
    print(f"\n=== Final Results ===")
    print(f"Total vulnerabilities found: {len(analyzed_results)}")
    for idx, cve in enumerate(analyzed_results, 1):
        print(f"{idx}. [{cve['cve_id']}] {cve['description'][:60]}...")

    return {
        "raw_results": results,
        "analyzed_results": analyzed_results
    }
231 | 
232 | 
if __name__ == "__main__":
    # Manual smoke run: look up a few sample components and store the
    # results under ./cve_results.
    components = ["BusyBox 1.01", "hostapd 2.0-devel", "wpa_supplicant 2.0-devel"]

    print("Starting component vulnerability query...")
    all_results = {}
    for component in components:
        print(f"\n=== Querying component: {component} ===")
        all_results[component] = query_nvd_and_mitre(component, "./cve_results")
        # Short pause between components.
        time.sleep(1)

    print("\nQuery complete")
249 | 


--------------------------------------------------------------------------------
/firmanalyzer/Examples/buffalo/summary.txt:
--------------------------------------------------------------------------------
 1 | '''
 2 | Firmware Summary:
 3 | [Basic Info]
 4 | - Name/Version: Buffalo WSR1166DD Firmware v1.5.5
 5 | - Device/Type/Arch: Buffalo WSR1166DD, MIPS Architecture
 6 | - Key Info: Kernel version 4.4.25, Built on 2017-12-04
 7 | 
 8 | [Coverage] 
 9 | - Key Dirs: /bin, /lib/firmware, /sys/firmware, /sbin, /lib, /etc, /etc/ssl, /www
10 | - Key Files: /bin/busybox, /bin/ipcalc.sh, /bin/uclient-fetch, /bin/config_generate, /sbin/init, /sbin/netifd, /sbin/procd, /sbin/kmodloader, /sbin/logread, /sbin/fw3, /sbin/sysupgrade, /sbin/wifi, /lib/libc.so, /lib/libuci.so, /lib/libubox.so, /lib/uboot-envtools.sh, /lib/functions.sh, /etc/preinit, /etc/shadow, /etc/key-build.pub, /etc/sysctl.conf, /etc/rc.common, /etc/hotplug.json, /etc/profile, /etc/services, /etc/ssl/openssl.cnf, /etc/config/dropbear, /etc/config/uhttpd, /etc/config/ddns, /etc/config/etherwake, /etc/config/pptpd, /etc/config/rpcd, /etc/config/snmpd, /etc/init.d/dropbear, /etc/init.d/boot, /etc/init.d/embeddd, /etc/init.d/openvpn, /etc/init.d/pptpd, /etc/init.d/snmpd, /etc/ppp/options, /www/index.html, /etc/openvpn/server.conf, /lib/functions/preinit.sh, /lib/functions/uci-defaults.sh
11 | 
12 | [Main Issues]
13 | - Critical Issues:
14 |   - /etc/shadow: Root account has no password set (empty password field), confirmed by /etc/profile script warning, allowing unrestricted access and potential full system compromise.
15 |   - /etc/key-build.pub: Private key exposure ("private key 605c7f1ccfcc1f58") in a public file, risking unauthorized access to sensitive systems or data.
16 |   - /etc/ssl/openssl.cnf: References to private keys (cakey.pem, tsakey.pem) and placeholder passwords ('secret') expose sensitive cryptographic material. Weak hash algorithms (md5, sha1) are specified as acceptable message digests, increasing risks of collision attacks.
17 |   - /etc/config/uhttpd: Explicit reference to private key file (/etc/uhttpd.key). If improperly secured, it could allow decryption of HTTPS traffic or server impersonation.
18 |   - /bin/busybox: Multiple vulnerabilities (CVE-2019-5747, CVE-2021-28831, CVE-2018-20679, CVE-2017-16544, CVE-2017-15874, CVE-2017-15873, CVE-2016-6301, CVE-2015-9261, CVE-2022-30065, CVE-2021-42381, CVE-2023-42366, CVE-2023-42365, CVE-2023-42364, CVE-2023-42363) including heap-buffer-overflow, use-after-free, integer underflow/overflow, remote code execution, and denial of service risks.
19 |   - /etc/config/dropbear: 'PasswordAuth', 'RootPasswordAuth', and 'RootLogin' enabled by default, increasing brute force attack risks. Multiple CVEs identified (e.g., CVE-2023-48795, CVE-2021-36369, CVE-2020-36254, CVE-2019-12953, CVE-2018-15599) affecting Dropbear, with CVE-2023-48795 rated critical for integrity check bypass.
20 |   - /sbin/init: Use of insecure function sprintf without input validation or bounds checking at address 0x4015c8, increasing the risk of arbitrary code execution.
21 |   - /sbin/netifd: Format string vulnerabilities identified in printf (0x402974) and fprintf calls within sym._fini (0x4115a4).
22 |   - /sbin/procd: Absence of input validation or sanitization in the function chain leading to insecure functions like 'gets' and 'sscanf'.
23 |   - /sbin/fw3: Remote code execution vulnerability in `sym._init` due to insecure use of `gets` and dynamic code execution via `jalr t9`.
24 |   - /sbin/logread: OS Command Injection vulnerability (CVE-2023-29778) in logread component.
25 |   - /sbin/sysupgrade: '--restore-backup' option allows restoring configuration from a URL without proper validation, enabling arbitrary code execution if a malicious URL is provided.
26 |   - /sbin/wifi: Multiple critical vulnerabilities (CVE-2024-53940, CVE-2024-53939, CVE-2024-53937, CVE-2017-8772, CVE-2024-53938) including command injection, default credentials, and unauthenticated TELNET access.
27 |   - /lib/libc.so: Vulnerable to CVE-2019-14697, allowing out-of-bounds writes due to x87 floating-point stack adjustment imbalance. memcpy operation in sym.__init_ssp lacks input validation, and use of 'gets' in sym.bind_textdomain_codeset introduces buffer overflow risks.
28 |   - /etc/services: Insecure service configurations detected, including telnet (23/tcp), ftp (21/tcp), and finger (79/tcp), transmitting data in plaintext and exposing the system to interception and misuse.
29 |   - /etc/config/etherwake: Plaintext password (AABBCCDDEEFF) used for wake-on-LAN functionality, exposing sensitive credentials.
30 |   - /etc/config/pptpd: Plaintext credentials ('youruser'/'yourpass') and PPTP server IP configurations (local: 192.168.0.1, remote range: 192.168.0.20-30) exposed, increasing the risk of unauthorized access.
31 |   - /etc/config/snmpd: Default SNMP community strings "public" (read-only) and "private" (read-write) configured, exposing the system to unauthorized access and manipulation. Presence of outdated SNMP versions v1 and v2c increases risks of data interception and exploitation (CVE-2005-3722).
32 |   - /etc/init.d/boot: Hardcoded PSK (Pre-Shared Key) value 'FacWPAPSK1_BK=12345' exposes wireless network credentials, allowing unauthorized access if extracted.
33 |   - /etc/init.d/embeddd: Sensitive DDNS credentials (username, password, update_url) defined in plaintext within the script, risking exposure of authentication data.
34 |   - /etc/init.d/openvpn: Sensitive certificate and key data (ca_inline, cert_inline, key_inline, tls_inline) written in plaintext to `/var/run/ovpn.config`, and plaintext username/password written to `/var/run/ovpn_auth.txt` when user_pass_auth is enabled, risking exposure of cryptographic material and authentication data. Management interface bound to 127.0.0.1:14 without clear access restrictions, potentially allowing unauthorized control.
35 |   - /etc/init.d/pptpd: Plaintext password written to $CHAP_SECRETS file without encryption, exposing login credentials. Firewall rule allows unrestricted TCP access on port 1723, increasing exposure risks.
36 |   - /etc/ppp/options: Logging disabled by setting logfile to /dev/null, removing audit trails. Additionally, maxfail 0 permits unlimited failed connection attempts, increasing brute-force risks.
37 |   - /etc/openvpn/server.conf: Management interface bound to 127.0.0.1:14 without additional authentication mechanisms, posing a risk if improperly exposed externally.
38 |   - /lib/functions/uci-defaults.sh: Potential sensitive data exposure identified through patterns resembling password handling (e.g., 'local key="$2"', 'json_add_boolean "$key"'). If these handle credentials without proper security measures, it could lead to sensitive data exposure.
39 | 
40 | - Major Issues:
41 |   - /etc/sysctl.conf: Disabled bridge firewalling (net.bridge.bridge-nf-call-* set to 0) and enabled IP forwarding for IPv4 and IPv6 (net.ipv4.ip_forward=1, net.ipv6.conf.all.forwarding=1), increasing attack surface and potential exposure to network attacks.
42 |   - /lib/libuci.so: Affected by CVE-2020-28951, introducing use-after-free risks when handling malicious package names, potentially leading to memory corruption or privilege escalation.
43 |   - /lib/libubox.so: Affected by CVE-2020-7248, a stack-based buffer overflow in JSON serialization functionality, potentially allowing remote code execution.
44 |   - /sbin/kmodloader: Stack-based buffer overflow in __dn_expand function (CVE-2014-3484), affecting musl libc versions before 1.1.2 and versions 0.9.13 through 1.0.3.
45 |   - /lib/uboot-envtools.sh: Lack of input validation before writing configurations to /etc/fw_env.config, potentially allowing malicious configuration injection.
46 |   - /bin/ipcalc.sh: Lack of input validation and sanitization in ARGV handling within functions like ip2int(), int2ip(), and compl32().
47 |   - /etc/hotplug.json: Creation of device nodes with broad permissions (e.g., '0666') and insecure use of 'exec' to call external scripts like '/sbin/hotplug-call', risking unauthorized access and script execution.
48 |   - /etc/config/ddns: Explicit fields for username ("your_username") and password ("your_password") placeholders, which could expose credentials if replaced with actual values.
49 |   - /etc/config/rpcd: Plaintext username ('webuser') and password ('$p$webuser') stored in an insecure format, increasing the risk of unauthorized access.
50 |   - /etc/init.d/snmpd: Dynamic construction of SNMP configuration file (/var/run/snmpd.conf) using user-provided values (e.g., community strings, source IPs) without secure defaults or validation, risking unauthorized access.
51 |   - /www/index.html: Version information exposure ('1.1.0+b3321bb2') in the meta tag could allow attackers to identify and exploit known vulnerabilities associated with this specific version.
52 | 
53 | - Other Issues:
54 |   - /etc/preinit: Version information exposure ('2006-2016') could indicate outdated software components with potential unpatched vulnerabilities.
55 |   - /etc/rc.common: Version information exposure ('2006-2012') and insecure handling of service control variables ($START, $STOP) without proper validation, risking unintended service behavior or exposure.
56 |   - /bin/busybox: Exposure of sensitive content such as '/etc/passwd' and '/etc/shadow' strings.
57 |   - /bin/config_generate: Default credentials ('username'/'password') embedded in plaintext for PPPoE configuration.
58 |   - /bin/uclient-fetch: Presence of '--password=<password>' string indicates potential insecure handling or exposure of credentials.
59 |   - /lib/functions.sh: Code injection risk in append function due to unsanitized use of 'eval' with user-controlled variables $var and $value. Exposure of version information ("Copyright (C) 2006-2014 OpenWrt.org") could help attackers identify outdated software.
60 | '''
61 | 
62 | 


--------------------------------------------------------------------------------
/firmanalyzer/Examples/dlink/DAP-2690_REVB_FIRMWARE_3.16.RC100_WW/summary.txt:
--------------------------------------------------------------------------------
 1 | ```
 2 | Firmware Summary:
 3 | [Basic Info]
 4 | - Name/Version: DAP-2690_REVB_FIRMWARE_3.16.RC100_WW
 5 | - Device/Type/Arch: DAP-2690 / Wireless Access Point / MIPS
 6 | - Key Info: Created 2016-03-21, BusyBox v1.14.1, SquashFS v4.0
 7 | 
 8 | [Coverage] 
 9 | - Key Dirs: /bin, /etc, /etc/cert, /etc/config, /etc/ssh, /bin/busybox.extracted, /sbin, /htdocs, /www, /lib, /usr
10 | - Key Files: /bin/busybox, /bin/ip, /bin/iplink, /bin/iproute, /bin/ping, /bin/ping6, /bin/sh, /bin/ps, /bin/mount, /bin/umount, /etc/cert/key.pem, /etc/config/defaultvalue.gz, /etc/ssh/ssh_host_dsa_key, /sbin/init, /sbin/hostapd, /sbin/httpd, /sbin/wpa_supplicant, /sbin/ifconfig, /sbin/insmod, /sbin/iwconfig, /sbin/iwlist, /sbin/iwpriv, /sbin/klogd, /sbin/lsmod, /sbin/mdev, /sbin/modprobe, /sbin/rmmod, /sbin/route, /sbin/sysctl, /sbin/syslogd, /sbin/tunctl, /sbin/vconfig, /sbin/wlanconfig, /sbin/ebtables, /sbin/ebtables-restore, /sbin/ebtables-save
11 | 
12 | [Main Issues]
13 | - Critical Issues: 
14 |   - /bin/busybox, /bin/iproute, /bin/ping, /bin/ping6, /bin/sh, /bin/ps, /bin/mount, /bin/umount, /sbin/init, /sbin/ifconfig, /sbin/insmod, /sbin/lsmod, /sbin/mdev, /sbin/modprobe, /sbin/rmmod, /sbin/route, /sbin/sysctl, /sbin/tunctl, /sbin/vconfig: Multiple critical CVEs (CVE-2022-48174, CVE-2022-30065, CVE-2022-28391, CVE-2021-42386, CVE-2018-20679, CVE-2021-42373 through CVE-2021-42386) in BusyBox v1.14.1 leading to RCE, stack overflow, and use-after-free vulnerabilities
15 |   - /bin/busybox, /bin/ip, /bin/iplink, /bin/ping6, /bin/sh, /bin/ps, /bin/mount, /sbin/init, /sbin/ifconfig, /sbin/lsmod, /sbin/mdev, /sbin/modprobe, /sbin/route, /sbin/tunctl, /sbin/vconfig: Unsafe function usage (gets, fgets, strcpy) without bounds checking in multiple functions (fcn.00415988, fcn.00408a2c, fcn.0040bf38, fcn.0041ca1c, fcn.00419880, fcn.00443400, fcn.00445598, fcn.0040fe9c)
16 |   - /sbin/httpd: Multiple critical vulnerabilities in httpd v1.3.6 (CVE-2007-3304, CVE-2007-3847, CVE-2007-5000) including buffer overflow and remote code execution
17 |   - /sbin/httpd: Unsafe function usage (memcpy, strcpy) without bounds checking in functions (fcn.0040d3d4, sym.process_request) risking RCE
18 |   - /sbin/hostapd: Multiple CVEs (CVE-2022-23304, CVE-2019-9499, CVE-2016-4476) in hostapd v0.8.x allowing side-channel attacks, authentication bypass, and DoS
19 |   - /sbin/wpa_supplicant: Multiple CVEs (CVE-2023-52160, CVE-2022-23304, CVE-2022-23303, CVE-2021-27803, CVE-2019-9496) in wpa_supplicant v3.3.2 allowing authentication bypass, side-channel attacks, and DoS
20 |   - /sbin/iwconfig, /sbin/iwlist, /sbin/iwpriv: Multiple high-risk vulnerabilities including buffer overflows (fcn.00403850, sym.iw_enum_devices, sym.iw_get_stats, fcn.00406440, sym.iw_print_key) due to improper use of `fgets`, `memcpy`, `strncpy`, and `strcpy` without bounds checking, risking RCE and memory corruption
21 |   - /sbin/klogd: Critical vulnerabilities in klogd v1.3.6 (CVE-2001-0738) and unsafe function usage (strcpy, sprintf, system) in functions (fcn.00400d54, fcn.00403538, fcn.00402890, fcn.00403d08) risking buffer overflow, command injection, and format string vulnerabilities
22 |   - /sbin/syslogd: Critical vulnerabilities in functions (fcn.004017b0, fcn.00402be4, fcn.00404e00, fcn.0040275c) due to insecure function usage (`sprintf`, `popen`, `strcpy`) and lack of input validation, risking buffer overflow, command injection, and format string vulnerabilities
23 |   - /sbin/vconfig: Critical vulnerabilities in functions (fcn.00415988, fcn.00408a2c, fcn.0040bf38) due to insecure function usage (gets, strcpy, fgets) and lack of input validation, risking buffer overflow and arbitrary code execution
24 |   - /sbin/ebtables-restore: Format string vulnerability in `main` function and critical use of `gets` in `entry0` function, risking RCE and privilege escalation
25 |   - /sbin/ebtables-save: Command injection vulnerability due to insecure use of backticks and environment variables (`EBTABLES_SAVE_COUNTER`), risking arbitrary command execution
26 | 
27 | - Major Issues:
28 |   - /etc/cert/key.pem: Private key stored in firmware without proper protection
29 |   - /etc/ssh/ssh_host_dsa_key: SSH host key stored in firmware
30 |   - /sbin/httpd: IP addresses (171.10.37, 39.32.9) embedded in version strings exposing sensitive network information
31 |   - /sbin/insmod: Multiple CVEs (CVE-2018-7170, CVE-2018-7171, CVE-2018-7172) in sed v4.0 allowing buffer overflow and arbitrary code execution
32 |   - /sbin/iwconfig, /sbin/iwlist, /sbin/iwpriv: Version information exposure (4.3.3, 3.3.2, 2.4, 2.0, 802.11) and insecure memory handling in functions (fcn.00401758, fcn.00404878, fcn.0040143c, fcn.00401f40, fcn.00406358) risking format string vulnerabilities and unvalidated input exploitation
33 |   - /sbin/wlanconfig, /sbin/ebtables: Version information exposure (3.3.2, 4.3.3, 2.0) which could be used to identify potential vulnerabilities
34 | 
35 | - Other Issues:
36 |   - /etc/config/defaultvalue.gz: Contains default configuration values that could be exploited if not properly secured
37 |   - /sbin/init, /sbin/hostapd, /sbin/httpd, /sbin/wpa_supplicant, /sbin/ifconfig, /sbin/insmod, /sbin/lsmod, /sbin/mdev, /sbin/modprobe, /sbin/rmmod, /sbin/route, /sbin/sysctl, /sbin/tunctl, /sbin/vconfig, /sbin/wlanconfig, /sbin/ebtables: Version information exposure (BusyBox v1.14.1, sed v4.0, hostapd v0.8.x, httpd v1.3.6, wpa_supplicant v3.3.2) that could be used to identify potential vulnerabilities
38 | ```
39 | 


--------------------------------------------------------------------------------
/firmanalyzer/Examples/dlink/DAP-3662/summary.txt:
--------------------------------------------------------------------------------
 1 | '''
 2 | Firmware Summary:
 3 | [Basic Info]
 4 | - Name/Version: DAP-3662 REVA FIRMWARE 1.00RC015
 5 | - Device/Type/Arch: DAP-3662 / Linux / MIPS
 6 | - Key Info: Kernel version 2.6.31, created 2015-01-20
 7 | 
 8 | [Coverage] 
 9 | - Key Dirs: /bin, /dev, /etc, /lib, /root, /sbin, /www
10 | - Key Files: bin/busybox, etc/ssh/ssh_host_dsa_key, etc/ssh/ssh_host_rsa_key, lib/libcrypto.so.0.9.8, lib/libssl.so.0.9.8, lib/ld-uClibc.so.0, lib/libc.so.0, lib/libradiusclient-ng.so.2, lib/libz.so.1.2.3, lib/libpthread.so.0, lib/libqc98xx.so, sbin/hostapd, sbin/httpd, sbin/ebtables, sbin/ebtables-restore, sbin/wpa_supplicant, sbin/iwconfig, sbin/iwpriv, sbin/klogd, sbin/syslogd, www/onlanchange.php, www/adv_array_auth.php, www/adv_array_scan.php, www/adv_captivals.php, www/adv_url_addr.php, www/__action.php, www/__action_bsc.php, www/__action_dhcp_server.php, www/adv_ap_array.php, www/adv_mssid.php, www/bsc_capwap.php, www/bsc_lan.php, www/bsc_wlan.php, www/st_device.php, www/st_stats_lan.php, www/st_wds_info.php, www/tool_admin.php, www/adv_acl.php, www/adv_array_config.php, www/adv_8021q_s.php, www/adv_qos.php, www/adv_radiusserver.php, www/adv_url.php, www/check_radiusclient.php, www/sys_cfg_valid.php, www/sys_fw_update.php, www/sys_setting.php, www/tool_sntp.php, www/login.php, www/session_login.php, www/adv_dhcpd.php, www/adv_mdhcpd.php, www/adv_arpspoofing.php, www/adv_8021q.php, www/adv_radiusclient.php, www/st_log.php
11 | 
12 | [Main Issues]
13 | - Critical Issues: 
14 |   [bin/busybox]: Contains two high-risk functions (fcn.004120cc and fcn.00427b4c) using 'system' with dynamic input, exposing command injection vulnerabilities. Environment variables processed without validation in fcn.00427b4c.
15 |   [bin/busybox]: Vulnerable to CVE-2021-28831 (invalid free/segmentation fault) and CVE-2019-5747 (out-of-bounds read) due to outdated version 1.14.1.
16 |   [etc/ssh/ssh_host_dsa_key]: Contains exposed DSA private key, leading to potential unauthorized access if compromised.
17 |   [etc/ssh/ssh_host_rsa_key]: Contains exposed RSA private key, leading to potential unauthorized access if compromised.
18 |   [lib/libcrypto.so.0.9.8]: Outdated version (0.9.8za) vulnerable to CVE-2019-1547 (ECDSA key recovery) and contains potential password string 'SGCKEYSALT'.
19 |   [lib/libssl.so.0.9.8]: Outdated version (0.9.8za) vulnerable to CVE-2008-1678 (memory leak) and contains high-risk vulnerabilities in 'sym.dtls1_read_bytes' (buffer overflow) and 'sym.dtls1_read_failed' (format string).
20 |   [lib/ld-uClibc.so.0]: Outdated version (1.7.0) vulnerable to CVE-2022-30295 (DNS cache poisoning), CVE-2022-29503 (memory corruption), CVE-2017-9729 (stack exhaustion), and CVE-2017-9728 (out-of-bounds read).
21 |   [lib/libc.so.0]: Vulnerable to CVE-2018-1000001 (buffer underflow in realpath()) and contains critical vulnerabilities in memcpy and fread_unlocked functions due to lack of bounds checking, leading to potential remote code execution.
22 |   [lib/libradiusclient-ng.so.2]: Critical buffer overflow vulnerabilities in `sym.rc_read_dictionary` function due to insecure use of `fgets` and `strcpy` without proper bounds checking or input validation.
23 |   [lib/libz.so.1.2.3]: Vulnerable to multiple CVEs (CVE-2018-25032, CVE-2005-2096, CVE-2005-1849, CVE-2004-0797, CVE-2002-0059) including memory corruption, buffer overflow, and denial of service issues.
24 |   [lib/libpthread.so.0]: Vulnerable to CVE-2022-29503 (memory corruption) and contains critical indirect function call vulnerability in 'sym.pthread_attr_getschedparam' leading to potential control flow hijacking and remote code execution.
25 |   [lib/libqc98xx.so]: Critical buffer overflow vulnerabilities in 'sym.art_otpRead' (indirect control via gp register) and 'sym.art_memRead' (memcpy in loop without bounds checking), leading to potential memory corruption and remote code execution.
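26 |   [sbin/hostapd]: Linked to outdated OpenSSL libraries (libssl.so.0.9.8, libcrypto.so.0.9.8) known to have critical vulnerabilities such as CVE-2008-1678 (memory leak) and CVE-2019-1547 (ECDSA key recovery). Heartbleed (CVE-2014-0160) was also flagged, but it affects only OpenSSL 1.0.1 through 1.0.1f, not the 0.9.8 branch, so that finding should be re-verified.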
27 |   [sbin/iwconfig]: Function fcn.00403568 contains buffer overflow vulnerability (strcpy without length checks) and format string vulnerability (sscanf with limited input validation), allowing remote code execution.
28 |   [sbin/iwpriv]: Critical format string vulnerability in sym.iw_get_priv_info function (printf with unvalidated user input), exposing remote code execution risk.
29 |   [sbin/klogd]: Command injection and buffer overflow vulnerabilities in function fcn.00400d54 (system calls with hardcoded commands and strcpy without bounds checking), accessible from main function.
30 |   [sbin/klogd]: Vulnerable to CVE-2001-0738 (DoS via null bytes in log messages) due to detected version 1.3.6.
31 |   [www/onlanchange.php]: Command injection vulnerability in `query()` function without proper input validation, allowing malicious command execution if input is controlled by attacker.
32 |   [www/adv_captivals.php]: Exposure of sensitive credentials including RADIUS server secrets ($cfg_radius_sec, $cfg_acc_sec) and LDAP passwords ($cfg_ldap_password) in the code, with potential risk even if encrypted via 'queryEnc' function.
33 |   [www/adv_url_addr.php]: Insecure handling and storage of passwords in code segments like 'var r_list=[['index','name','passwd','status']' and 'echo ",\n ['".$@."','".get("j","name")."','".queryEnc("passwd")."','".query("enable")."']";'.
35 |   [www/__action.php]: Hardcoded file paths like '/var/proc/web/session:'.$sid.'/user/group' and '/www/permission_deny.php' could be exploited if not properly secured. Sensitive information such as user_name, new_password, and other configuration details are exposed in HTML comments.
36 |   [www/__action_bsc.php]: Hardcoded password/key exposure in 'echo "key = ". $f_key ."\n";' at line 96, revealing sensitive configuration parameters (f_auth, f_cipher, f_key, f_radius_srv_1, f_radius_sec_1) without proper protection.
37 |   [www/__action_dhcp_server.php]: Insecure configuration handling and lack of input validation for user-supplied variables (srv_enable, ipaddr, f_endip), allowing potential injection or manipulation of DHCP server settings.
38 |   [www/adv_ap_array.php]: Password exposure in 'ap_array_pwd' field and version information disclosure ('m_version', 'ap_array_ver'), with potential insecure handling of encrypted query data via 'queryEnc' function.
39 |   [www/adv_mssid.php]: Exposure of sensitive network credentials and configurations, including WEP keys, WPA PSK, and RADIUS secrets, through the `queryEnc` function.
40 |   [www/bsc_capwap.php]: Potential hardcoded credentials and sensitive configurations detected, including 'admin:password' and 'API_KEY=12345'. Missing '__admin_check.php' file could lead to unauthorized access.
41 |   [www/bsc_wlan.php]: Insecure WEP key handling and weak password validation practices, including plaintext WEP key references and weak validation logic.
42 |   [www/st_device.php]: Active use and configuration of WEP encryption for both 2.4GHz and 5GHz networks, exposing the network to security risks such as eavesdropping and unauthorized access.
43 |   [www/st_stats_lan.php]: Hardcoded database credentials (username: 'admin', password: 'admin123') and sensitive configuration data exposed in plaintext.
44 |   [www/st_wds_info.php]: Hardcoded database credentials (username: 'admin', password: 'password123') and API keys ('api_key=1234567890abcdef') exposed in plaintext.
45 |   [www/tool_admin.php]: Password handling logic with weak validation and no encryption or hashing mechanisms detected, leaving passwords potentially exposed in plaintext.
46 |   [www/adv_acl.php]: File upload vulnerability in form "frm_acl" with insufficient input validation, only checking file extension (".acl") without content validation, allowing potential malicious file uploads.
47 |   [www/adv_radiusserver.php]: Insecure password handling with plaintext storage, no encryption or hashing mechanisms, and potential hardcoded credentials. Lack of input validation and access control mechanisms.
48 |   [www/adv_url.php]: Insecure password handling and storage with plaintext references and unclear encryption implementation in 'queryEnc' function.
49 |   [www/check_radiusclient.php]: Insecure file handling and session management issues using `unlink` to delete session-related files without proper validation or sanitization, potentially leading to unintended file deletion or manipulation.
50 |   [www/sys_fw_update.php]: Insecure session and authentication configurations explicitly disabling authentication (`$NO_NEED_AUTH="1";`) and session timeout (`$NO_SESSION_TIMEOUT="1";`), allowing unauthorized access or session hijacking.
51 |   [www/sys_setting.php]: Lack of CSRF protection in critical functions (`do_reboot()`, `do_factory_reset()`, `do_clear_language()`), allowing potential CSRF attacks to execute unintended actions.
52 |   [www/tool_sntp.php]: Use of hardcoded, potentially untrusted NTP server IP '207.232.83.70', exposing the device to time synchronization attacks or exploitation if the server is compromised.
53 |   [www/login.php]: Insecure handling of session cookies and lack of secure cookie attributes (HttpOnly, Secure), exposing session cookies to theft via XSS or man-in-the-middle attacks.
54 |   [www/session_login.php]: Exposure of client MAC addresses and IP addresses through PHP variables embedded in JavaScript, leading to potential information disclosure.
55 |   [www/adv_dhcpd.php]: Exposure of IP address and network configuration details, including DHCP server pool settings and LAN IP addresses, which could be exploited if accessed by unauthorized users.
56 |   [www/adv_mdhcpd.php]: Potential input validation issues in IP address handling functions (is_valid_ip3, is_valid_mask, invalid_ip_mask), leading to IP spoofing or misconfiguration.
57 |   [www/adv_arpspoofing.php]: Insecure handling of IP and MAC addresses without proper input validation or sanitization, potentially leading to injection attacks or unauthorized access to network data.
58 |   [www/adv_8021q.php]: Potential injection vulnerabilities due to dynamic script generation using variables without clear input validation or sanitization.
59 |   [www/adv_radiusclient.php]: Potential exposure of RADIUS server IP and password in the HTML form, though the password field is masked as a password input type.
60 |   [www/st_log.php]: The 'doClear()' function allows clearing system logs, which could be exploited to erase evidence of malicious activity. While it is restricted to users with 'AUTH_GROUP' set to '0', this restriction relies on the integrity of the authentication mechanism.
61 | 
62 | - Major Issues: 
63 |   [bin/busybox]: Exposes root credential (USER=root) and version information (v1.14.1, 1.14.1, 9.9) which could be exploited if used insecurely.
64 |   [sbin/hostapd]: Contains version strings 'v2.0-devel' exposing outdated software version, and sensitive content (URLs, IPs, email). Handles sensitive cryptographic material (WEP keys, EAPOL-Key, MPPE keys) with potential exposure risk.
65 |   [sbin/httpd]: Exposes firmware version path '/runtime/sys/info/firmwareversion' and HTTP version error message indicating potential misconfigurations.
66 |   [sbin/wpa_supplicant]: Exposes version 'v2.0-devel' and contains sensitive information (WEP/WPA keys, EAPOL-Key frames) with potential network service exposure (IPs, URLs).
67 |   [sbin/ebtables, sbin/ebtables-restore]: Potentially vulnerable to multiple CVEs including CVE-2022-48641 (memory leak), CVE-2011-1080 (information disclosure), CVE-2010-0007 (access control bypass), and CVE-2005-3110 (DoS).
68 |   [sbin/syslogd]: Potential format string vulnerability in function fcn.004011f0 (printf with hardcoded string format without input validation), accessible from privileged contexts.
69 |   [www/adv_array_auth.php]: Sensitive data exposure in JavaScript arrays (`ar_auth_list` and `serial_list`) containing 'name', 'password', 'group', 'number', 'duration', 'enddate', and 'device' embedded directly in HTML output.
70 |   [www/adv_array_scan.php]: Exposure of sensitive configuration data (WLAN settings, AP array passwords, IPv6 status) and debug information in HTML output.
71 |   [www/bsc_lan.php]: Potential sensitive information exposure in debug comments, including IP addresses, netmask, gateway, and DNS settings.
72 |   [www/adv_array_config.php]: Sensitive configuration exposure through debug output (`echo "<!--debug";`) revealing WLAN settings, security parameters, and system configurations.
73 |   [www/adv_8021q_s.php]: Potential sensitive information exposure including IP addresses, URLs, and API tokens detected in multiple instances.
74 |   [www/adv_qos.php]: Potential access control issue due to missing or improperly implemented '__admin_check.php' file, leading to unauthorized access to administrative functions.
75 |   [www/sys_cfg_valid.php]: Potential exposure of configuration parameters and insecure handling of query results, directly using query results (`$cfg_mode` and `$cfg_mssid`) in JavaScript without proper validation or sanitization, leading to XSS or other injection vulnerabilities.
76 | '''
77 | 


--------------------------------------------------------------------------------
/firmanalyzer/Examples/dlink/DAP-3662/token_usage.jsonl:
--------------------------------------------------------------------------------
 1 | {"input_cost": 0.00135, "output_cost": 0.00076, "total_cost": 0.00211}
 2 | {"input_cost": 0.00135, "output_cost": 0.00058, "total_cost": 0.00193}
 3 | {"input_cost": 0.0094225, "output_cost": 0.0005600000000000001, "total_cost": 0.0099825}
 4 | {"input_cost": 0.0015225000000000002, "output_cost": 0.00031, "total_cost": 0.011815}
 5 | {"input_cost": 0.00135, "output_cost": 0.00058, "total_cost": 0.00193}
 6 | {"input_cost": 0.0019000000000000002, "output_cost": 0.00079, "total_cost": 0.00269}
 7 | {"input_cost": 0.004900000000000001, "output_cost": 0.0026000000000000003, "total_cost": 0.010190000000000001}
 8 | {"input_cost": 0.0015275000000000002, "output_cost": 0.00027, "total_cost": 0.0017975000000000003}
 9 | {"input_cost": 0.0032825000000000003, "output_cost": 0.00099, "total_cost": 0.0042725}
10 | {"input_cost": 0.006005000000000001, "output_cost": 0.00266, "total_cost": 0.012937500000000001}
11 | {"input_cost": 0.001515, "output_cost": 0.00028000000000000003, "total_cost": 0.0017950000000000002}
12 | {"input_cost": 0.0047375, "output_cost": 0.00088, "total_cost": 0.0056175}
13 | {"input_cost": 0.0014825, "output_cost": 0.00124, "total_cost": 0.00834}
14 | {"input_cost": 0.00135, "output_cost": 0.00058, "total_cost": 0.00193}
15 | {"input_cost": 0.0048725, "output_cost": 0.0009400000000000001, "total_cost": 0.0058125}
16 | {"input_cost": 0.0019375000000000002, "output_cost": 0.0025700000000000002, "total_cost": 0.01032}
17 | {"input_cost": 0.0014275000000000002, "output_cost": 0.00036, "total_cost": 0.0017875000000000002}
18 | {"input_cost": 0.005052500000000001, "output_cost": 0.00079, "total_cost": 0.0058425000000000005}
19 | {"input_cost": 0.0029200000000000003, "output_cost": 0.00027, "total_cost": 0.0090325}
20 | {"input_cost": 0.00144, "output_cost": 0.00030000000000000003, "total_cost": 0.0017400000000000002}
21 | {"input_cost": 0.0050225, "output_cost": 0.001, "total_cost": 0.0060225}
22 | {"input_cost": 0.005812500000000001, "output_cost": 0.0059900000000000005, "total_cost": 0.017825}
23 | {"input_cost": 0.0058025, "output_cost": 0.00442, "total_cost": 0.0102225}
24 | {"input_cost": 0.004465, "output_cost": 0.0030800000000000003, "total_cost": 0.0075450000000000005}
25 | {"input_cost": 0.00135, "output_cost": 0.00058, "total_cost": 0.00193}
26 | {"input_cost": 0.009725000000000001, "output_cost": 0.00018, "total_cost": 0.009905}
27 | 


--------------------------------------------------------------------------------
/firmanalyzer/Examples/mikrotik/routeros-7.5-mipsbe/summary.txt:
--------------------------------------------------------------------------------
 1 | ```
 2 | Firmware Summary:
 3 | [Basic Info]
 4 | - Name/Version: MikroTik RouterOS 7.5
 5 | - Device/Type/Arch: Router/MIPS/Big Endian
 6 | - Key Info: Created 2022-08-30; kernel version not stated explicitly (module paths under /lib/modules/5.6.3 indicate Linux 5.6.3)
 7 | 
 8 | [Coverage] 
 9 | - Key Dirs: /sbin, /bndl, /home/web/webfig, /etc, /lib, /lib/modules/5.6.3/kernel/crypto, /lib/modules/5.6.3/misc, /lib/modules/5.6.3/net, /lib/modules/5.6.3/drivers/char, /lib/modules/5.6.3/drivers/net, /lib/modules/5.6.3/kernel/arch, /lib/modules/5.6.3/kernel/drivers, /lib/modules/5.6.3/kernel/fs, /lib/modules/5.6.3/kernel/lib, /lib/modules/5.6.3/kernel/net
10 | - Key Files: /sbin/sysinit, /bndl/*/*.jg.gz, /home/web/webfig/iframe.html.gz, /etc/qca8719L-7.5.fwf, /etc/qca9531L-7.5.fwf, /lib/libcrypto.so.1.0.0, /lib/libc.so, /lib/libeap.so, /lib/libjson.so, /lib/modules/5.6.3/kernel/crypto/sha1_generic.ko, /lib/modules/5.6.3/kernel/crypto/sha512_generic.ko, /lib/modules/5.6.3/kernel/net/ipv4/ip_tunnel.ko, /lib/modules/5.6.3/kernel/net/ipv4/udp_tunnel.ko, /lib/modules/5.6.3/kernel/net/ipv6/ipv6.ko, /lib/modules/5.6.3/kernel/net/ipv6/ah6.ko, /lib/modules/5.6.3/kernel/net/ipv6/esp6.ko, /lib/modules/5.6.3/kernel/net/ipv6/ip6_udp_tunnel.ko, /lib/modules/5.6.3/net/bridge/bridge2_netfilter.ko, /lib/modules/5.6.3/net/bridge/bridge2.ko, /lib/modules/5.6.3/net/netfilter/xt_tls.ko, /lib/modules/5.6.3/kernel/net/ipv6/netfilter/nf_defrag_ipv6.ko, /lib/modules/5.6.3/kernel/net/ipv6/netfilter/nf_reject_ipv6.ko
11 | 
12 | [Main Issues]
13 | - Critical Issues:
14 |   - /sbin/sysinit: Binary appears packed/obfuscated (i~packer command detected), hindering static analysis and potentially concealing malicious behavior
15 |   - /bndl/hotspot/home/web/hotspot/login.html: Contains embedded SVG image (offset 0x637) which could be used for XSS or other web-based attacks
16 |   - /etc/qca8719L-7.5.fwf: Contains TFTP-related functionality ("Illegal TFTP Operation" string found), exposing device to potential unauthorized firmware updates or configuration changes
17 |   - /lib/libcrypto.so.1.0.0: Outdated OpenSSL 1.0.2 with multiple critical vulnerabilities (CVE-2022-2068, CVE-2022-1292, CVE-2022-0778) that could lead to command injection, DoS, and private key exposure
18 |   - /lib/libc.so: Multiple critical vulnerabilities in musl libc 1.1.6, including unsafe `strcpy` usage in dynamic linking functions and stack-based buffer overflows (CVE-2019-14697, CVE-2015-1817, CVE-2014-3484)
19 |   - /lib/modules/5.6.3/kernel/crypto/sha512_generic.ko: Contains critical vulnerabilities including unbounded memory operations (e.g., `memset` with hardcoded size 0xd0), potential infinite loops, and risky `memcpy` calls without bounds checking, which could lead to memory corruption, denial-of-service, or remote code execution
20 |   - /lib/modules/5.6.3/kernel/fs/ext4/ext4.ko: Multiple critical CVEs including CVE-2022-48631 (extents parsing bug), CVE-2019-11833 (uninitialized memory exposure), and others related to denial of service and NULL pointer dereference vulnerabilities, risking system crashes and data exposure
21 |   - /lib/modules/5.6.3/kernel/drivers/net/wireguard/wireguard.ko: Contains version strings (1.0.0, 5.6.3, 11.1.0) indicating potential exposure to CVE-2021-46873 (affects WireGuard 0.5.3 and earlier), risking private key leakage and other security issues
22 |   - /lib/modules/5.6.3/kernel/net/mpls/mpls_router.ko: Contains critical vulnerabilities including buffer overflow risks (multiple `memcpy` calls without bounds checking), uninitialized variables, lack of input validation, and complex control flow susceptible to manipulation, increasing the risk of remote exploitation
23 |   - /lib/modules/5.6.3/kernel/fs/fat/fat.ko: Contains version strings (5.6.3 and 11.1.0) and is potentially vulnerable to CVE-2020-5203 (arbitrary code execution via Fat-Free Framework's Clear method)
24 |   - /lib/modules/5.6.3/kernel/fs/fat/vfat.ko: Contains critical vulnerabilities including uninitialized variables, buffer overflow risks in `memcpy` calls (e.g., at 0x80018d8, 0x8000e90, and 0x8001678), and insufficient input validation, which could lead to remote code execution or privilege escalation
25 |   - /lib/modules/5.6.3/kernel/drivers/net/ethernet/intel/e100.ko: Contains critical vulnerabilities including use-after-free bug (CVE-2022-49026), unvalidated `memcpy` calls, and dynamic loading risks (`dlopen`, `dlsym`), leading to potential remote code execution or system crashes
26 |   - /lib/modules/5.6.3/kernel/net/unix/unix.ko: Contains critical vulnerabilities including uninitialized variables, risky `memcpy` calls without bounds checking, and complex control flow susceptible to manipulation. Function `sym.unix_gc` at address `0x80042f0` is particularly vulnerable to buffer overflow and use-after-free attacks.
27 |   - /lib/modules/5.6.3/kernel/fs/jbd2/jbd2.ko: Contains critical vulnerabilities in functions such as `sym.jbd2_journal_commit_transaction`, `fcn.08004658`, and `sym.jbd2_journal_write_revoke_records` due to unsafe `memcpy` usage without bounds checking, insufficient error handling, and unvalidated size parameters, leading to memory corruption, privilege escalation, and arbitrary code execution.
28 |   - /lib/modules/5.6.3/kernel/drivers/usb/core/usbcore.ko: Contains version strings ('5.6.3', '11.1.0') exposing potential vulnerabilities associated with these versions, increasing attack surface
29 |   - /lib/modules/5.6.3/kernel/drivers/usb/host/ohci-hcd.ko: Contains critical vulnerabilities including direct `system` calls without input validation in `sym.ohci_hub_control` (0x80016a4) and `fcn.08002740` (0x8002740), uninitialized variables, and memory corruption risks, leading to potential command injection, arbitrary code execution, or privilege escalation
30 |   - /lib/modules/5.6.3/kernel/drivers/usb/storage/usb-storage.ko: Contains critical vulnerabilities including unsafe `memcpy` usage in `sym.usb_stor_access_xfer_buf` and `sym.usb_stor_invoke_transport`, lack of input validation, and potential for buffer overflows, leading to remote code execution, memory corruption, and data exposure
31 | 
32 | - Major Issues:
33 |   - Multiple compressed web interface files (*.jg.gz) in /bndl and /home/web/webfig directories lack integrity checks, making them vulnerable to tampering
34 |   - /etc: Contains potential sensitive system configuration files without clear access controls or integrity verification
35 |   - /etc/qca9531L-7.5.fwf: Contains hardware/firmware identifiers ("QCA953x", "alpha2", "crs125g") and boot process details that could aid attackers in targeting known vulnerabilities
36 |   - /lib/libeap.so: Potential insecure handling of authentication and encryption mechanisms, with references to sensitive information like 'password', 'key', and 'token'
37 |   - /lib/libjson.so: Contains token validation logic ('Invalid token:' string found) with potential security implications if improperly implemented, and lacks version information making vulnerability assessment difficult
38 |   - /lib/modules/5.6.3/kernel/drivers/net: Contains multiple network driver modules with potential vulnerabilities in packet handling and network interface management
39 |   - /lib/modules/5.6.3/kernel/drivers/usb: Contains USB driver modules with potential vulnerabilities in device handling and data transfer
40 |   - /lib/modules/5.6.3/kernel/fs/configfs, /lib/modules/5.6.3/kernel/fs/fat, /lib/modules/5.6.3/kernel/fs/jbd2, /lib/modules/5.6.3/kernel/fs/nls: Filesystem-related security risks in data handling and storage
41 |   - /lib/modules/5.6.3/kernel/net/rfkill, /lib/modules/5.6.3/kernel/net/sched, /lib/modules/5.6.3/kernel/net/unix, /lib/modules/5.6.3/kernel/net/ipv4/netfilter: Potential kernel module vulnerabilities in network traffic handling and filtering
42 |   - /lib/modules/5.6.3/kernel/drivers/usb/class, /lib/modules/5.6.3/kernel/drivers/usb/common, /lib/modules/5.6.3/kernel/drivers/usb/gadget, /lib/modules/5.6.3/kernel/drivers/usb/serial, /lib/modules/5.6.3/kernel/drivers/usb/storage: USB driver-related security risks in device handling and data transfer
43 |   - /lib/modules/5.6.3/kernel/drivers/net/bonding, /lib/modules/5.6.3/kernel/drivers/net/ethernet, /lib/modules/5.6.3/kernel/drivers/net/slip: Network driver-related security risks in packet handling and interface management
44 | 
45 | - Other Issues:
46 |   - XZ compressed data extraction failed at offset 0x9F993F, potentially indicating corrupted or incomplete firmware components
47 |   - /lib: Contains security-relevant binaries without version information or integrity checks
48 | ```
49 | 


--------------------------------------------------------------------------------
/firmanalyzer/Examples/mikrotik/routeros-7.5-mipsbe/token_usage.jsonl:
--------------------------------------------------------------------------------
  1 | {"input_cost": 0.0015075000000000002, "output_cost": 0.00031, "total_cost": 0.0018175}
  2 | {"input_cost": 0.00442, "output_cost": 0.0006000000000000001, "total_cost": 0.00502}
  3 | {"input_cost": 0.0018075, "output_cost": 0.00031, "total_cost": 0.0071375}
  4 | {"input_cost": 0.004370000000000001, "output_cost": 0.00058, "total_cost": 0.00495}
  5 | {"input_cost": 0.0015925000000000002, "output_cost": 0.00067, "total_cost": 0.0072125}
  6 | {"input_cost": 0.0019150000000000003, "output_cost": 0.0007800000000000001, "total_cost": 0.0026950000000000003}
  7 | {"input_cost": 0.0028225000000000004, "output_cost": 0.0089, "total_cost": 0.0144175}
  8 | {"input_cost": 0.0022075000000000003, "output_cost": 0.0008200000000000001, "total_cost": 0.0030275000000000002}
  9 | {"input_cost": 0.0033475, "output_cost": 0.0022500000000000003, "total_cost": 0.008625}
 10 | {"input_cost": 0.0028175, "output_cost": 0.00084, "total_cost": 0.0036575}
 11 | {"input_cost": 0.00134, "output_cost": 0.0005600000000000001, "total_cost": 0.0055575}
 12 | {"input_cost": 0.0028325000000000004, "output_cost": 0.00142, "total_cost": 0.0042525}
 13 | {"input_cost": 0.0013925, "output_cost": 0.0008200000000000001, "total_cost": 0.006465}
 14 | {"input_cost": 0.0029425000000000002, "output_cost": 0.00142, "total_cost": 0.0043625}
 15 | {"input_cost": 0.00134, "output_cost": 0.0005600000000000001, "total_cost": 0.006262500000000001}
 16 | {"input_cost": 0.0029875, "output_cost": 0.0009000000000000001, "total_cost": 0.0038875000000000003}
 17 | {"input_cost": 0.00134, "output_cost": 0.0005600000000000001, "total_cost": 0.005787500000000001}
 18 | {"input_cost": 0.00319, "output_cost": 0.001, "total_cost": 0.00419}
 19 | {"input_cost": 0.0021375, "output_cost": 0.0013000000000000002, "total_cost": 0.007627500000000001}
 20 | {"input_cost": 0.0044, "output_cost": 0.0009500000000000001, "total_cost": 0.005350000000000001}
 21 | {"input_cost": 0.005240000000000001, "output_cost": 0.00031, "total_cost": 0.010900000000000002}
 22 | {"input_cost": 0.004365, "output_cost": 0.00093, "total_cost": 0.005295}
 23 | {"input_cost": 0.00134, "output_cost": 0.0005600000000000001, "total_cost": 0.007195}
 24 | {"input_cost": 0.0044875, "output_cost": 0.0008300000000000001, "total_cost": 0.0053175}
 25 | {"input_cost": 0.0018325000000000001, "output_cost": 0.0010400000000000001, "total_cost": 0.00819}
 26 | {"input_cost": 0.004445, "output_cost": 0.00093, "total_cost": 0.0053750000000000004}
 27 | {"input_cost": 0.0034300000000000003, "output_cost": 0.00027, "total_cost": 0.009075}
 28 | {"input_cost": 0.00445, "output_cost": 0.00084, "total_cost": 0.0052899999999999996}
 29 | {"input_cost": 0.00134, "output_cost": 0.00055, "total_cost": 0.00718}
 30 | {"input_cost": 0.004455000000000001, "output_cost": 0.0008900000000000001, "total_cost": 0.005345000000000001}
 31 | {"input_cost": 0.00134, "output_cost": 0.0005600000000000001, "total_cost": 0.0072450000000000014}
 32 | {"input_cost": 0.004647500000000001, "output_cost": 0.0007400000000000001, "total_cost": 0.005387500000000001}
 33 | {"input_cost": 0.0015325000000000002, "output_cost": 0.00134, "total_cost": 0.00826}
 34 | {"input_cost": 0.00461, "output_cost": 0.0007300000000000001, "total_cost": 0.00534}
 35 | {"input_cost": 0.00134, "output_cost": 0.0005600000000000001, "total_cost": 0.00724}
 36 | {"input_cost": 0.00502, "output_cost": 0.00092, "total_cost": 0.00594}
 37 | {"input_cost": 0.0017375000000000001, "output_cost": 0.00067, "total_cost": 0.0083475}
 38 | {"input_cost": 0.0055000000000000005, "output_cost": 0.00126, "total_cost": 0.00676}
 39 | {"input_cost": 0.00134, "output_cost": 0.0005600000000000001, "total_cost": 0.008660000000000001}
 40 | {"input_cost": 0.005505, "output_cost": 0.00101, "total_cost": 0.006515}
 41 | {"input_cost": 0.00231, "output_cost": 0.0034300000000000003, "total_cost": 0.012255}
 42 | {"input_cost": 0.0066925000000000005, "output_cost": 0.0009400000000000001, "total_cost": 0.0076325}
 43 | {"input_cost": 0.0018425000000000002, "output_cost": 0.00216, "total_cost": 0.011635}
 44 | {"input_cost": 0.006860000000000001, "output_cost": 0.0011300000000000001, "total_cost": 0.00799}
 45 | {"input_cost": 0.0033925, "output_cost": 0.0043300000000000005, "total_cost": 0.0157125}
 46 | {"input_cost": 0.0077625, "output_cost": 0.00109, "total_cost": 0.008852500000000001}
 47 | {"input_cost": 0.0019775, "output_cost": 0.00317, "total_cost": 0.014000000000000002}
 48 | {"input_cost": 0.008440000000000001, "output_cost": 0.0015300000000000001, "total_cost": 0.009970000000000001}
 49 | {"input_cost": 0.0035875000000000004, "output_cost": 0.00451, "total_cost": 0.0180675}
 50 | {"input_cost": 0.0098125, "output_cost": 0.00107, "total_cost": 0.0108825}
 51 | {"input_cost": 0.010242500000000002, "output_cost": 0.00031, "total_cost": 0.021435000000000003}
 52 | {"input_cost": 0.009770000000000001, "output_cost": 0.00088, "total_cost": 0.010650000000000001}
 53 | {"input_cost": 0.0021175, "output_cost": 0.00031, "total_cost": 0.013077500000000002}
 54 | {"input_cost": 0.009985, "output_cost": 0.0009000000000000001, "total_cost": 0.010885}
 55 | {"input_cost": 0.00134, "output_cost": 0.0005600000000000001, "total_cost": 0.012785000000000001}
 56 | {"input_cost": 0.010302500000000001, "output_cost": 0.0010400000000000001, "total_cost": 0.011342500000000002}
 57 | {"input_cost": 0.00235, "output_cost": 0.0024700000000000004, "total_cost": 0.016162500000000003}
 58 | {"input_cost": 0.011302500000000002, "output_cost": 0.0015300000000000001, "total_cost": 0.012832500000000002}
 59 | {"input_cost": 0.001585, "output_cost": 0.0021100000000000003, "total_cost": 0.0165275}
 60 | {"input_cost": 0.011702500000000001, "output_cost": 0.0008, "total_cost": 0.012502500000000001}
 61 | {"input_cost": 0.0015325000000000002, "output_cost": 0.0015, "total_cost": 0.015535000000000002}
 62 | {"input_cost": 0.0056700000000000006, "output_cost": 0.0008500000000000001, "total_cost": 0.006520000000000001}
 63 | {"input_cost": 0.00134, "output_cost": 0.0005600000000000001, "total_cost": 0.00842}
 64 | {"input_cost": 0.005675, "output_cost": 0.00092, "total_cost": 0.006595}
 65 | {"input_cost": 0.0047375, "output_cost": 0.00031, "total_cost": 0.0116425}
 66 | {"input_cost": 0.0056275000000000006, "output_cost": 0.0010400000000000001, "total_cost": 0.006667500000000001}
 67 | {"input_cost": 0.0015350000000000001, "output_cost": 0.00031, "total_cost": 0.008512500000000001}
 68 | {"input_cost": 0.0069275000000000005, "output_cost": 0.00084, "total_cost": 0.0077675}
 69 | {"input_cost": 0.0015425, "output_cost": 0.00126, "total_cost": 0.01057}
 70 | {"input_cost": 0.006880000000000001, "output_cost": 0.0008900000000000001, "total_cost": 0.007770000000000001}
 71 | {"input_cost": 0.0015475, "output_cost": 0.0011500000000000002, "total_cost": 0.010467500000000001}
 72 | {"input_cost": 0.006835000000000001, "output_cost": 0.0009100000000000001, "total_cost": 0.007745000000000001}
 73 | {"input_cost": 0.0020825, "output_cost": 0.00031, "total_cost": 0.0101375}
 74 | {"input_cost": 0.006797500000000001, "output_cost": 0.0011, "total_cost": 0.0078975}
 75 | {"input_cost": 0.0017400000000000002, "output_cost": 0.0006900000000000001, "total_cost": 0.0103275}
 76 | {"input_cost": 0.00676, "output_cost": 0.00093, "total_cost": 0.007690000000000001}
 77 | {"input_cost": 0.0015400000000000001, "output_cost": 0.0013100000000000002, "total_cost": 0.01054}
 78 | {"input_cost": 0.0067150000000000005, "output_cost": 0.00092, "total_cost": 0.007635}
 79 | {"input_cost": 0.0015450000000000001, "output_cost": 0.0016400000000000002, "total_cost": 0.01082}
 80 | {"input_cost": 0.006670000000000001, "output_cost": 0.0009100000000000001, "total_cost": 0.007580000000000001}
 81 | {"input_cost": 0.0023350000000000003, "output_cost": 0.00099, "total_cost": 0.010905000000000001}
 82 | {"input_cost": 0.006627500000000001, "output_cost": 0.0008600000000000001, "total_cost": 0.007487500000000001}
 83 | {"input_cost": 0.0017300000000000002, "output_cost": 0.0006100000000000001, "total_cost": 0.009827500000000001}
 84 | {"input_cost": 0.006965000000000001, "output_cost": 0.00093, "total_cost": 0.007895000000000001}
 85 | {"input_cost": 0.0015325000000000002, "output_cost": 0.0018300000000000002, "total_cost": 0.011257500000000002}
 86 | {"input_cost": 0.0069125, "output_cost": 0.0009500000000000001, "total_cost": 0.0078625}
 87 | {"input_cost": 0.00134, "output_cost": 0.0005600000000000001, "total_cost": 0.0097625}
 88 | {"input_cost": 0.006917500000000001, "output_cost": 0.00101, "total_cost": 0.0079275}
 89 | {"input_cost": 0.0015400000000000001, "output_cost": 0.0019500000000000001, "total_cost": 0.0114175}
 90 | {"input_cost": 0.0070575, "output_cost": 0.00088, "total_cost": 0.0079375}
 91 | {"input_cost": 0.0015350000000000001, "output_cost": 0.00031, "total_cost": 0.0097825}
 92 | {"input_cost": 0.0072125, "output_cost": 0.00103, "total_cost": 0.0082425}
 93 | {"input_cost": 0.0015450000000000001, "output_cost": 0.0017200000000000002, "total_cost": 0.0115075}
 94 | {"input_cost": 0.00742, "output_cost": 0.0008900000000000001, "total_cost": 0.00831}
 95 | {"input_cost": 0.0015325000000000002, "output_cost": 0.00158, "total_cost": 0.0114225}
 96 | {"input_cost": 0.0074600000000000005, "output_cost": 0.00099, "total_cost": 0.008450000000000001}
 97 | {"input_cost": 0.0017375000000000001, "output_cost": 0.00176, "total_cost": 0.011947500000000002}
 98 | {"input_cost": 0.0076075000000000005, "output_cost": 0.00099, "total_cost": 0.008597500000000001}
 99 | {"input_cost": 0.0015375, "output_cost": 0.0011500000000000002, "total_cost": 0.011285000000000002}
100 | {"input_cost": 0.007555000000000001, "output_cost": 0.00088, "total_cost": 0.008435000000000002}
101 | {"input_cost": 0.0015350000000000001, "output_cost": 0.00033000000000000005, "total_cost": 0.010300000000000002}
102 | {"input_cost": 0.007505, "output_cost": 0.00103, "total_cost": 0.008535000000000001}
103 | {"input_cost": 0.0033175, "output_cost": 0.00031, "total_cost": 0.012162500000000001}
104 | {"input_cost": 0.007452500000000001, "output_cost": 0.0010400000000000001, "total_cost": 0.0084925}
105 | {"input_cost": 0.0015375, "output_cost": 0.0015600000000000002, "total_cost": 0.01159}
106 | {"input_cost": 0.007620000000000001, "output_cost": 0.00116, "total_cost": 0.008780000000000001}
107 | {"input_cost": 0.001955, "output_cost": 0.00031, "total_cost": 0.011045000000000001}
108 | {"input_cost": 0.007575000000000001, "output_cost": 0.00092, "total_cost": 0.008495}
109 | {"input_cost": 0.001975, "output_cost": 0.00237, "total_cost": 0.01284}
110 | {"input_cost": 0.00742, "output_cost": 0.00022, "total_cost": 0.00764}
111 | 


--------------------------------------------------------------------------------
/firmanalyzer/Examples/mikrotik/routeros-x86-6.49.6/summary.txt:
--------------------------------------------------------------------------------
 1 | ```
 2 | Firmware Summary:
 3 | [Basic Info]
 4 | - Name/Version: MikroTik RouterOS x86 6.49.6
 5 | - Device/Type/Arch: Router/x86
 6 | - Key Info: Created 2022-04-07, SquashFS v4.0, xz compression
 7 | 
 8 | [Coverage] 
 9 | - Key Dirs: /bndl/advanced-tools, /bndl/dhcp, /bndl/hotspot, /bndl/mpls, /bndl/ppp, /sbin, /etc, /lib
10 | - Key Files: /bin/catlog, webfig files (*.jg.gz), hotspot/login.html, /sbin/sysinit, /sbin/fsck, /sbin/fsck.ext2, /sbin/kexec, /sbin/mke2fs, /sbin/vmcore-dmesg, /etc/passwd, /lib/libcrypto.so.1.0.0, /lib/libssl.so.1.0.0, /lib/ld-uClibc-0.9.33.2.so, /lib/libuClibc-0.9.33.2.so, /lib/libpthread-0.9.33.2.so, /lib/libm-0.9.33.2.so, /lib/libz.so, /lib/libuhttp.so, /lib/libucrypto.so, /lib/libumsg.so, /lib/liburadius.so, /lib/libutil-0.9.33.2.so, /lib/libdl-0.9.33.2.so, /lib/librt-0.9.33.2.so, /lib/libgcc_s.so.1, /lib/libuc++.so
11 | 
12 | [Main Issues]
13 | - Critical Issues: 
14 |   - /bin/catlog: Format string vulnerabilities in main() and sym.str2i_string_const_() functions, allowing arbitrary read/write and potential RCE
15 |   - /sbin/sysinit: Multiple critical vulnerabilities in fcn.0804f792 and fcn.0804aaf8 including lack of stack protection, uncontrolled code execution paths, and memory corruption patterns
16 |   - /sbin/fsck: Stack overflow, format string vulnerabilities, and unprotected printf usage enabling remote code execution and control flow hijacking
17 |   - /sbin/fsck.ext2: Multiple critical vulnerabilities (CVE-2015-1572, CVE-2015-0247, CVE-2007-5497) allowing arbitrary code execution via crafted filesystem images
18 |   - /sbin/fsck.ext2: Stack-based buffer overflows in main function and other critical functions (fcn.08060848, fcn.0806b684, fcn.0806c12e) with no stack canary protection
19 |   - /sbin/mke2fs: Heap-based buffer overflow in fcn.0804afc8, unsafe strcpy usage in fcn.0805000c, and unprotected memory operations in fcn.0804d03d, allowing remote code execution
20 |   - /sbin/vmcore-dmesg: Format string injection in fprintf calls (fcn.08049c40), recursive jump patterns enabling stack exhaustion, and lack of stack canaries, bounds checks, and input validation
21 |   - /etc/passwd: Root user has empty password field (::), allowing unrestricted root access
22 |   - /lib/libcrypto.so.1.0.0: Multiple critical vulnerabilities in OpenSSL 1.0.2 (CVE-2022-2068, CVE-2022-0778, CVE-2021-3712) allowing remote code execution, denial of service, or sensitive data exposure
23 |   - /lib/libssl.so.1.0.0: Critical vulnerabilities including stack buffer overflows, format string vulnerabilities, and insecure cryptographic operations (CVE-2019-1551), enabling remote code execution and cryptographic context compromise
24 |   - /lib/ld-uClibc-0.9.33.2.so: Critical vulnerabilities (CVE-2022-30295, CVE-2022-29503) leading to DNS cache poisoning, memory corruption, and remote code execution
25 |   - /lib/libuClibc-0.9.33.2.so: Multiple critical vulnerabilities (CVE-2022-30295, CVE-2022-29503, CVE-2017-9729, CVE-2017-9728) with exploitable buffer overflows in fcn.000264b8, fcn.0000f4b5, and sym.ttyname_r, allowing remote code execution and privilege escalation
26 |   - /lib/libpthread-0.9.33.2.so: Critical vulnerabilities (CVE-2022-30295, CVE-2022-29503) in uClibc 0.9.33.2, enabling remote code execution and memory corruption
27 |   - /lib/libuhttp.so: Critical vulnerabilities in sym.HttpClient::onData_int__unsigned_int_ (unmonitored gets() call at 0xa3f2), sym.HttpClient::connectAfterResolve__ (missing input validation), and sym.HttpClient::genericRequest_string_const__HttpRequest_const__string__function_void_____ (vulnerable snprintf call at 0x890f), leading to stack overflow and potential EIP overwrite
28 |   - /lib/libucrypto.so: Critical format string vulnerability in sym.BigNum::str___const due to unsafe snprintf usage with user-controlled format parameter and fixed buffer size of 9 bytes, susceptible to exploitation
29 |   - /lib/libumsg.so: Critical vulnerabilities including unprotected strcpy usage in method.nv::Looper (address 162140), dangerous strcpy usage in sym.nv::Logger::connectToLog__ (address 174498), stack buffer overflow in method.nv.getFreeMemory_unsigned_int_ (address 156117), and format string vulnerability in sym.bytes2str_unsigned_long_long_ (address 204625), enabling remote code execution and memory corruption
30 |   - /lib/liburadius.so: Critical format string vulnerability in method.radius.getCodeName_radius::RadiusCode_ (address 14088) due to unvalidated user input passed to printf, enabling arbitrary read/write and remote code execution
31 |   - /lib/libutil-0.9.33.2.so: Critical buffer overflow in sym.openpty function due to unsafe strcpy usage, allowing arbitrary memory overwrite and remote code execution
32 |   - /lib/libdl-0.9.33.2.so: Critical format string vulnerability in sym.dlinfo function due to missing format string validation, direct user input exposure, and presence of %n specifier, enabling arbitrary memory writes and remote code execution
33 |   - /lib/librt-0.9.33.2.so: Critical vulnerabilities including format string vulnerability in fcn.0000196c, buffer overflow, use-after-free, and infinite loop vulnerabilities in fcn.00000f32, and CVE-2021-38604 (NULL pointer dereference)
34 |   - /lib/libgcc_s.so.1: Critical vulnerabilities in sym.__emutls_get_address including unsafe gets() usage, memory corruption patterns, abort-on-failure behavior, and control flow integrity issues
35 |   - /lib/libuc++.so: Multiple critical format string vulnerabilities in functions (sym.operator___ostream__unsigned_int_, sym.operator___ostream__int_, sym.operator___ostream__unsigned_long_long_, sym.operator___ostream__long_long_, sym.IPAddr6::str_bool__const), enabling remote code execution, memory corruption, and protection bypass due to W^X violations and the lack of stack canaries and ASLR
36 | 
37 | - Major Issues: 
38 |   - Web interface files (*.jg.gz): Multiple compressed web interface files with potential for code injection if decompression is mishandled
39 |   - /sbin/kexec: Multiple CVEs affecting kexec version 2.0.12 (CVE-2021-20269, CVE-2015-0267, CVE-2011-3590, CVE-2011-3589, CVE-2011-3588) leading to information disclosure, privilege escalation, or man-in-the-middle attacks
40 |   - /lib/libz.so: Potential vulnerabilities (CVE-2022-37434, CVE-2018-25032, CVE-2005-2096, CVE-2005-1849, CVE-2004-0797) affecting suspected versions 1.2.3 or 3.0, leading to heap-based buffer over-read/overflow, memory corruption, or denial of service
41 |   - /lib/liburadius.so: Dependency on libgcc_s.so.1 with CVE-2022-48422, allowing local privilege escalation via Trojan horse libgcc_s.so.1 in the current working directory
42 | 
43 | - Other Issues: 
44 |   - /bndl/hotspot/home/web/hotspot/login.html: Contains embedded SVG image which could be used for XSS if not properly sanitized
45 |   - /sbin/fsck and /sbin/fsck.ext2: Version exposure (1.40.11, 4.8.2, 3.0) that could aid attackers in targeting known vulnerabilities
46 |   - /sbin/mke2fs: Version exposure (EXT2FS Library version 1.40.11) that could aid attackers in targeting known vulnerabilities
47 |   - /lib/libm-0.9.33.2.so: Potential version exposure (4.8.2) that could aid attackers in targeting known vulnerabilities
48 |   - /lib/libumsg.so: Version information exposure (6.49.3, 1.1, 3.0) and protocol-related strings (HTTP/1.1, l2mtu) detected, aiding vulnerability identification
49 | ```
50 | 


--------------------------------------------------------------------------------
/firmanalyzer/Examples/mikrotik/routeros-x86-6.49.6/token_usage.jsonl:
--------------------------------------------------------------------------------
 1 | {"input_cost": 0.0015075000000000002, "output_cost": 0.00134, "total_cost": 0.0028475}
 2 | {"input_cost": 0.004557500000000001, "output_cost": 0.0007800000000000001, "total_cost": 0.005337500000000001}
 3 | {"input_cost": 0.0017825000000000002, "output_cost": 0.00321, "total_cost": 0.010330000000000002}
 4 | {"input_cost": 0.0019375000000000002, "output_cost": 0.0008300000000000001, "total_cost": 0.0027675000000000004}
 5 | {"input_cost": 0.002265, "output_cost": 0.0027400000000000002, "total_cost": 0.007772500000000002}
 6 | {"input_cost": 0.0030550000000000004, "output_cost": 0.00101, "total_cost": 0.004065000000000001}
 7 | {"input_cost": 0.002, "output_cost": 0.0031300000000000004, "total_cost": 0.009195000000000002}
 8 | {"input_cost": 0.0031225000000000003, "output_cost": 0.0009400000000000001, "total_cost": 0.0040625}
 9 | {"input_cost": 0.004125, "output_cost": 0.006390000000000001, "total_cost": 0.0145775}
10 | {"input_cost": 0.0064875, "output_cost": 0.00022, "total_cost": 0.0067075}
11 | 


--------------------------------------------------------------------------------
/firmanalyzer/Examples/openwrt/fbecd0858ac36049e04bf9dd8acd3dd53fed97b4/summary.txt:
--------------------------------------------------------------------------------
 1 | ```
 2 | Firmware Summary:
 3 | [Basic Info]
 4 | - Name/Version: OpenWrt Linux-4.19.69
 5 | - Device/Type/Arch: MIPS32
 6 | - Key Info: Release date: 2019-09-05, Kernel version: 4.19.69, BusyBox version: 1.31.0
 7 | 
 8 | [Coverage] 
 9 | - Key Dirs: /bin, /etc/board.d, /sbin, /etc, /lib, /usr/bin, /usr/sbin, /usr/lib, /lib/wifi, /etc/rc.button
10 | - Key Files: /bin/busybox, /bin/uclient-fetch, /bin/board_detect, /bin/config_generate, /sbin/procd, /sbin/netifd, /sbin/ubusd, /sbin/uci, /etc/profile, /etc/device_info, /etc/banner, /etc/services, /etc/shadow, /lib/libc.so, /lib/functions.sh, /lib/libfstools.so, /lib/libvalidate.so, /etc/config/dropbear, /etc/config/dhcp, /usr/bin/fwtool, /usr/bin/usign, /usr/sbin/dnsmasq, /usr/sbin/dropbear, /usr/sbin/odhcpd, /usr/sbin/wpad, /usr/sbin/iw, /usr/sbin/odhcp6c, /usr/sbin/pppd, /usr/sbin/xtables-legacy-multi, /usr/lib/libip4tc.so.2.0.0, /usr/lib/libip6tc.so.2.0.0, /usr/lib/libiptext4.so, /usr/lib/libjson-c.so.4.0.0, /usr/lib/libxtables.so.12.2.0, /lib/network/config.sh, /lib/wifi/mac80211.sh, /usr/lib/pppd/2.4.7/rp-pppoe.so, /etc/rc.button/failsafe, /etc/rc.button/reset, /etc/rc.button/rfkill, /etc/rc.button/wps
11 | 
12 | [Main Issues]
13 | - Critical Issues: 
14 |   - /bin/busybox: Multiple critical vulnerabilities (CVE-2022-48174, CVE-2022-30065, CVE-2022-28391) including stack buffer overflow, use-after-free, and arbitrary code execution. Lacks ASLR/PIE protection, has writable GOT, and contains direct '/bin/sh' string without validation.
15 |   - /sbin/netifd: Critical stack-based buffer overflow in entry0 function due to use of vulnerable 'gets' function. Lacks stack canary protection, has executable stack (NX-bit disabled), and no PIC, enabling shellcode execution and control flow hijacking.
16 |   - /sbin/ubusd: Critical vulnerabilities including register-controlled execution flow enabling ROP chain construction via stack buffer overflow, RWX memory segment allowing self-modifying code and runtime unpacking. No stack canary, ASLR, or W^X protections detected.
17 |   - /lib/libfstools.so: Two critical command injection vulnerabilities in sym.jffs2_switch and sym.fopivot functions via uncontrolled format strings and unvalidated user input in system() calls, enabling full root command execution.
18 |   - /etc/shadow: Empty root password hash (::) detected, allowing unrestricted root access to the system.
19 |   - /etc/config/dropbear: Insecure SSH configuration with password authentication enabled for both regular users and root ('PasswordAuth' and 'RootPasswordAuth' set to 'on'), exposing the system to brute-force attacks. Default SSH port 22 in use.
20 |   - /usr/sbin/dnsmasq: Multiple critical vulnerabilities in version 2.80 (CVE-2020-25687, CVE-2020-25683, CVE-2020-25682, CVE-2020-25681, CVE-2020-25684, CVE-2020-25685, CVE-2020-25686, CVE-2017-14491, CVE-2017-14492, CVE-2017-14493) including heap-based buffer overflows, DNS cache poisoning, and remote code execution.
21 |   - /usr/sbin/dropbear: Critical vulnerabilities including CVE-2023-48795 (Terrapin attack) and CVE-2017-9078 (post-authentication root RCE), exposing SSH server to integrity bypass and remote code execution.
22 |   - /usr/sbin/wpad: Critical stack-based buffer overflow in function fcn.00418020 due to unvalidated HTTP request input, enabling remote code execution. Multiple CVEs affecting hostapd/wpa_supplicant v2.7 (CVE-2019-9499, CVE-2019-9498, CVE-2019-9497, CVE-2019-9496, CVE-2019-9495, CVE-2019-9494) including authentication bypass and side-channel attacks. Vulnerable SAE/EAP-PWD configurations detected.
23 |   - /usr/sbin/pppd: Critical insecure debug logging configuration with 'show-password' enabled, exposing credentials in debug logs. Sensitive content (password=, user=) detected without proper protection, and 'hide-password' disabled by default, increasing credential exposure risk.
24 |   - /usr/lib/libxtables.so.12.2.0: Critical vulnerabilities in sym.xtables_numeric_to_ip6addr (missing stack protections, buffer overflow) and fcn.000026a0 (fixed-size buffer with unbounded input), enabling unauthenticated RCE and privilege escalation.
25 |   - /usr/lib/dnsmasq/dhcp-script.sh: Critical arbitrary code execution vulnerability via uncontrolled sourcing of external script through $USER_DHCPSCRIPT environment variable, enabling privilege escalation if the variable is attacker-controlled.
26 |   - /lib/network/config.sh: Critical insecure handling of network interface configuration and ubus calls. The 'ubus_call' function does not validate or sanitize its inputs, which could lead to injection attacks if the input is controlled by an attacker.
27 |   - /lib/wifi/mac80211.sh: Critical insecure default wireless configuration with default SSID 'OpenWrt' and no encryption (encryption=none), exposing the network to unauthorized access and potential attacks.
28 |   - /etc/rc.button/failsafe: Critical insecure file handling, writing environment variable ${BUTTON} to /tmp/failsafe_button without validation or sanitization, potentially leading to file manipulation or injection attacks.
29 |   - /etc/rc.button/reset: Critical insecure command execution, executing `reboot` and `jffs2reset -y` without proper input validation, potentially leading to unintended system resets or factory resets.
30 |   - /etc/rc.button/wps: Critical insecure handling of WPS credentials and potential command injection risk. The script processes WPS credentials using `ubus` calls without proper validation or sanitization, dynamically constructing JSON payloads with user-supplied input (`ssid`, `key`, `encryption`), which could be exploited for command injection or JSON injection.
31 | 
32 | - Major Issues:
33 |   - /bin/config_generate: Multiple instances of hardcoded credentials in network configuration (username='username', password='password') for PPPoE and general network settings, exposing sensitive authentication data.
34 |   - /bin/uclient-fetch: Hardcoded credentials detected with string 'password=<password>'
35 |   - /lib/functions.sh: Insecure file handling and command injection risk in user_add and group_add functions due to direct manipulation of /etc/passwd, /etc/shadow, and /etc/group without proper input validation or sanitization.
36 |   - /lib/libc.so: CVE-2019-14697 vulnerability in musl libc version 1.1.23 (x87 floating-point stack adjustment imbalance) and potential sensitive credential exposure with hashed string '$1$abcd0123$9Qcg8DyviekV3tDGMZynJ1'.
37 |   - /etc/banner: Firmware version information exposure ('OpenWrt SNAPSHOT, r10956-62dbe361a1') enabling targeted attacks against known vulnerabilities.
38 |   - /etc/config/dhcp: Internal network configuration exposure including DNS settings, DHCP lease file paths, and interface bindings, potentially revealing network structure and attack vectors.
39 |   - /usr/lib/libjson-c.so.4.0.0: Potential version exposure detected, with version-related strings like 'json_c_version' and 'json_c_version_num', but no explicit version number found. Medium-severity issue as it could aid attackers in identifying vulnerabilities.
40 |   - /usr/lib/pppd/2.4.7/rp-pppoe.so: Version information exposure through strings 'RP-PPPoE plugin version %s compiled against pppd %s', potentially aiding attackers in identifying vulnerabilities.
41 |   - /etc/rc.button/rfkill: Major insecure configuration handling in wireless settings, modifying wireless configuration using 'uci set' and 'uci commit' without explicit validation or sanitization of input, potentially leading to insecure configurations.
42 | 
43 | - Other Issues:
44 |   - /bin/busybox: Potential improper handling of sensitive system files (/etc/passwd, /etc/shadow)
45 |   - /sbin/procd: Embedded version string 'r1gGa' detected, potentially exposing version information to attackers
46 |   - /etc/device_info: Device information exposure (manufacturer, product, revision) could aid reconnaissance efforts
47 |   - /usr/sbin/iw: Version information exposure through version-related strings in executable
48 | ```
49 | 


--------------------------------------------------------------------------------
/firmanalyzer/Examples/openwrt/fbecd0858ac36049e04bf9dd8acd3dd53fed97b4/token_usage.jsonl:
--------------------------------------------------------------------------------
 1 | {"input_cost": 0.0013800000000000002, "output_cost": 0.0017400000000000002, "total_cost": 0.0031200000000000004}
 2 | {"input_cost": 0.0037375000000000004, "output_cost": 0.0007400000000000001, "total_cost": 0.004477500000000001}
 3 | {"input_cost": 0.0021775, "output_cost": 0.0021100000000000003, "total_cost": 0.008765000000000002}
 4 | {"input_cost": 0.0020325, "output_cost": 0.00084, "total_cost": 0.0028725}
 5 | {"input_cost": 0.00476, "output_cost": 0.0023000000000000004, "total_cost": 0.0099325}
 6 | {"input_cost": 0.0025775000000000004, "output_cost": 0.0009600000000000001, "total_cost": 0.0035375000000000007}
 7 | {"input_cost": 0.0027900000000000004, "output_cost": 0.00804, "total_cost": 0.014367500000000002}
 8 | {"input_cost": 0.0031875000000000002, "output_cost": 0.00107, "total_cost": 0.0042575}
 9 | {"input_cost": 0.00269, "output_cost": 0.0031200000000000004, "total_cost": 0.0100675}
10 | {"input_cost": 0.0037725000000000002, "output_cost": 0.00092, "total_cost": 0.0046925000000000005}
11 | {"input_cost": 0.0014775, "output_cost": 0.0009000000000000001, "total_cost": 0.007070000000000001}
12 | {"input_cost": 0.0040175, "output_cost": 0.0009000000000000001, "total_cost": 0.0049175}
13 | {"input_cost": 0.00134, "output_cost": 0.00062, "total_cost": 0.0068775}
14 | {"input_cost": 0.0040750000000000005, "output_cost": 0.0008200000000000001, "total_cost": 0.004895000000000001}
15 | {"input_cost": 0.0024325, "output_cost": 0.0022900000000000004, "total_cost": 0.009617500000000001}
16 | {"input_cost": 0.004365, "output_cost": 0.0008500000000000001, "total_cost": 0.005215}
17 | {"input_cost": 0.0030150000000000003, "output_cost": 0.00318, "total_cost": 0.01141}
18 | {"input_cost": 0.005785, "output_cost": 0.00097, "total_cost": 0.006755000000000001}
19 | {"input_cost": 0.0013950000000000002, "output_cost": 0.00107, "total_cost": 0.00922}
20 | {"input_cost": 0.0056375, "output_cost": 0.00103, "total_cost": 0.0066675}
21 | {"input_cost": 0.0025775000000000004, "output_cost": 0.00513, "total_cost": 0.014375}
22 | {"input_cost": 0.006045000000000001, "output_cost": 0.00125, "total_cost": 0.007295000000000001}
23 | {"input_cost": 0.0015175000000000002, "output_cost": 0.0012300000000000002, "total_cost": 0.010042500000000001}
24 | {"input_cost": 0.006027500000000001, "output_cost": 0.0013200000000000002, "total_cost": 0.007347500000000001}
25 | {"input_cost": 0.00134, "output_cost": 0.0006100000000000001, "total_cost": 0.0092975}
26 | {"input_cost": 0.0060175, "output_cost": 0.00126, "total_cost": 0.0072775}
27 | {"input_cost": 0.002735, "output_cost": 0.0034900000000000005, "total_cost": 0.0135025}
28 | {"input_cost": 0.005307500000000001, "output_cost": 0.0013100000000000002, "total_cost": 0.006617500000000001}
29 | {"input_cost": 0.00134, "output_cost": 0.0005700000000000001, "total_cost": 0.0085275}
30 | {"input_cost": 0.00529, "output_cost": 0.0011200000000000001, "total_cost": 0.006410000000000001}
31 | {"input_cost": 0.0014075000000000001, "output_cost": 0.00032, "total_cost": 0.0081375}
32 | {"input_cost": 0.005385, "output_cost": 0.00093, "total_cost": 0.006315}
33 | {"input_cost": 0.00134, "output_cost": 0.0005600000000000001, "total_cost": 0.008215}
34 | {"input_cost": 0.005365000000000001, "output_cost": 0.0011500000000000002, "total_cost": 0.006515000000000001}
35 | {"input_cost": 0.0014025, "output_cost": 0.00031, "total_cost": 0.0082275}
36 | {"input_cost": 0.005497500000000001, "output_cost": 0.00099, "total_cost": 0.0064875}
37 | {"input_cost": 0.00134, "output_cost": 0.00058, "total_cost": 0.0084075}
38 | {"input_cost": 0.0054800000000000005, "output_cost": 0.00088, "total_cost": 0.00636}
39 | {"input_cost": 0.0014075000000000001, "output_cost": 0.00031, "total_cost": 0.0080775}
40 | {"input_cost": 0.005615, "output_cost": 0.0011500000000000002, "total_cost": 0.006765}
41 | {"input_cost": 0.00134, "output_cost": 0.0006000000000000001, "total_cost": 0.008705000000000001}
42 | {"input_cost": 0.0056300000000000005, "output_cost": 0.0011500000000000002, "total_cost": 0.0067800000000000004}
43 | {"input_cost": 0.0014750000000000002, "output_cost": 0.00029, "total_cost": 0.008545}
44 | {"input_cost": 0.005775000000000001, "output_cost": 0.0007400000000000001, "total_cost": 0.006515000000000001}
45 | {"input_cost": 0.00184, "output_cost": 0.00076, "total_cost": 0.009115000000000002}
46 | {"input_cost": 0.005755000000000001, "output_cost": 0.00092, "total_cost": 0.006675}
47 | {"input_cost": 0.0013975, "output_cost": 0.0014500000000000001, "total_cost": 0.0095225}
48 | {"input_cost": 0.0057375, "output_cost": 0.001, "total_cost": 0.0067375}
49 | {"input_cost": 0.00134, "output_cost": 0.00059, "total_cost": 0.0086675}
50 | {"input_cost": 0.005752500000000001, "output_cost": 0.00107, "total_cost": 0.0068225000000000004}
51 | {"input_cost": 0.0014700000000000002, "output_cost": 0.00031, "total_cost": 0.0086025}
52 | {"input_cost": 0.0057375, "output_cost": 0.0007300000000000001, "total_cost": 0.0064675}
53 | {"input_cost": 0.0016950000000000001, "output_cost": 0.0027300000000000002, "total_cost": 0.0108925}
54 | {"input_cost": 0.006355, "output_cost": 0.0007800000000000001, "total_cost": 0.007135000000000001}
55 | {"input_cost": 0.009120000000000001, "output_cost": 0.00031, "total_cost": 0.016565000000000003}
56 | {"input_cost": 0.006325000000000001, "output_cost": 0.00022, "total_cost": 0.0065450000000000005}
57 | 


--------------------------------------------------------------------------------
/firmanalyzer/Examples/openwrt/openwrtSample/report.txt:
--------------------------------------------------------------------------------
  1 | '''
  2 | - [Location] bin/busybox
  3 | - [Type] Component
  4 | - [Version Info] BusyBox 1.28.4, CVE-2021-42381, CVE-2021-42380, CVE-2021-42379, CVE-2021-42378, CVE-2021-42377
  5 | - [Description] Multiple critical and high severity vulnerabilities found in the awk applet of BusyBox.
  6 | - [Details] Use-after-free issues in the awk applet allow remote code execution. CVE-2021-42377 also highlights command injection risks due to mishandling of shell commands.
  7 | - [Impact] Potential remote code execution and command injection attacks.
  8 | - [Risk Level] Critical
  9 | 
 10 | - [Location] bin/opkg
 11 | - [Type] Component
 12 | - [Version Info] Unknown
 13 | - [Description] Critical security issues identified in sym.remove_maintainer_scripts and sym.pkg_dest_init functions.
 14 | - [Details] Lack of input validation and use of insecure functions like sym_sprintf_alloc lead to format string vulnerabilities and arbitrary code execution risks. sym.pkg_dest_init handles configuration files without sanitization.
 15 | - [Impact] Arbitrary code execution and memory corruption risks.
 16 | - [Risk Level] Critical
 17 | 
 18 | - [Location] bin/uclient-fetch
 19 | - [Type] Component/Credential
 20 | - [Version Info] Unknown
 21 | - [Description] Sensitive content and critical vulnerabilities detected.
 22 | - [Details] Embedded HTTP authentication password parameter (--password=<password>) poses credential exposure risk. Function pointer execution without validation (sym.imp.getenv) and unvalidated parameters passed to memcpy via sym.imp.uclient_set_proxy_url could lead to memory corruption or remote code execution.
 23 | - [Impact] Potential credential exposure and remote code execution/memory corruption.
 24 | - [Risk Level] Critical
 25 | 
 26 | - [Location] bin/config_generate
 27 | - [Type] Configuration/Credential
 28 | - [Version Info] Unknown
 29 | - [Description] Hardcoded default credentials and insecure configurations.
 30 | - [Details] Default password 'password' embedded. Default IP addresses (e.g., 192.168.1.1), subnet masks, NTP servers ('0.openwrt.pool.ntp.org'), and hostname ('OpenWrt') are hardcoded. PPPoE network configurations include default username 'username' and password 'password'.
 31 | - [Impact] Unauthorized access due to easily guessable credentials and potential fingerprinting of the system.
 32 | - [Risk Level] High
 33 | '''
 34 | '''
 35 | - [Location] sbin/init
 36 | - [Type] Component
 37 | - [Version Info] Unknown
 38 | - [Description] Potential exposure of debug functionality and insecure use of 'chroot'.
 39 | - [Details] The binary contains references to 'init_debug' and '/tmp/debug_level', indicating possible debug functionality. Additionally, improper implementation of 'chroot' without privilege dropping could lead to privilege escalation.
 40 | - [Impact] Exposure of sensitive information or privilege escalation if misconfigured.
 41 | - [Risk Level] Medium
 42 | 
 43 | - [Location] sbin/init
 44 | - [Type] Component
 45 | - [Version Info] Unknown
 46 | - [Description] Dependency on potentially outdated or vulnerable shared libraries.
 47 | - [Details] The binary depends on libraries such as 'libubox.so', 'libubus.so', and 'libjson-c.so.2'. Outdated versions of these libraries may contain known vulnerabilities.
 48 | - [Impact] Possible exploitation of library vulnerabilities leading to system compromise.
 49 | - [Risk Level] Medium
 50 | 
 51 | - [Location] sbin/init
 52 | - [Type] Component
 53 | - [Version Info] Unknown
 54 | - [Description] Critical security risks in function fcn.004019d4 due to improper handling of sensitive operations.
 55 | - [Details] Function constructs and executes commands using hardcoded strings ('/bin/sh', '/etc/preinit') without input validation, allowing potential command injection.
 56 | - [Impact] Remote code execution or privilege escalation through malicious payloads.
 57 | - [Risk Level] Critical
 58 | 
 59 | - [Location] sbin/mtd
 60 | - [Type] Component
 61 | - [Version Info] Version 2.0, CVE-2016-9092
 62 | - [Description] Cross-site request forgery (CSRF) vulnerability in the Mail Threat Defense (MTD) management console.
 63 | - [Details] CVE-2016-9092 allows unauthorized actions using an authenticated administrator's privileges.
 64 | - [Impact] Unauthorized configuration changes or actions by attackers.
 65 | - [Risk Level] High
 66 | 
 67 | - [Location] sbin/mtd
 68 | - [Type] Component
 69 | - [Version Info] Unknown
 70 | - [Description] Critical risk identified in disassembly analysis.
 71 | - [Details] Unconditional jump to insecure system call at 0x400f84, combined with lack of identifiable callers for sym.imp.sscanf and handling of 'str.unlock'.
 72 | - [Impact] Potential remote code execution or command injection.
 73 | - [Risk Level] Critical
 74 | 
 75 | - [Location] sbin/netifd
 76 | - [Type] Component
 77 | - [Version Info] OpenWrt versions prior to 19.07.7, CVE-2021-22161
 78 | - [Description] Routing loop vulnerability when IPv6 is used.
 79 | - [Details] CVE-2021-22161 describes a routing loop condition leading to excessive network traffic.
 80 | - [Impact] Network performance degradation or denial of service.
 81 | - [Risk Level] High
 82 | 
 83 | - [Location] sbin/netifd
 84 | - [Type] Component
 85 | - [Version Info] Unknown
 86 | - [Description] Critical vulnerabilities in disassembly analysis.
 87 | - [Details] Format string vulnerability in fprintf, unvalidated input passed to recv, and memcpy with attacker-controllable parameters.
 88 | - [Impact] Remote code execution, memory corruption, or buffer overflow attacks.
 89 | - [Risk Level] Critical
 90 | 
 91 | - [Location] sbin/rpcd
 92 | - [Type] Component
 93 | - [Version Info] Unknown
 94 | - [Description] Critical vulnerabilities in RPC handling functions.
 95 | - [Details] Insecure printf/asprintf calls with user-controlled inputs and format string vulnerabilities.
 96 | - [Impact] Remote code execution or system compromise via malicious RPC inputs.
 97 | - [Risk Level] Critical
 98 | 
 99 | - [Location] sbin/rpcd
100 | - [Type] Credential
101 | - [Version Info] Unknown
102 | - [Description] Sensitive keyword exposure.
103 | - [Details] Presence of keywords 'password' and 'keys' suggests potential sensitive data handling.
104 | - [Impact] Unauthorized access or credential leakage if improperly managed.
105 | - [Risk Level] Medium
106 | 
107 | - [Location] sbin/logread
108 | - [Type] Configuration
109 | - [Version Info] Unknown
110 | - [Description] Potential exposure of operational parameters.
111 | - [Details] Pattern 'u0fcs:l:r:F:p:S:P:h:e:t' indicates embedded sensitive configuration data.
112 | - [Impact] Exposure of operational details or sensitive configurations.
113 | - [Risk Level] Medium
114 | 
115 | - [Location] sbin/uci
116 | - [Type] Component
117 | - [Version Info] Affected by CVE-2017-17867
118 | - [Description] Known vulnerability allowing arbitrary OS command execution.
119 | - [Details] CVE-2017-17867 allows authenticated users to execute commands via manipulation of configuration fields.
120 | - [Impact] Arbitrary command execution through insecure configuration handling.
121 | - [Risk Level] High
122 | 
123 | - [Location] sbin/uci
124 | - [Type] Component
125 | - [Version Info] Unknown
126 | - [Description] Critical security issue due to insecure use of 'sscanf'.
127 | - [Details] Lack of input validation for 'sscanf' increases risk of buffer overflow or format string vulnerabilities.
128 | - [Impact] Possible remote code execution or system compromise.
129 | - [Risk Level] Critical
130 | 
131 | - [Location] sbin/wifi
132 | - [Type] Credential
133 | - [Version Info] Unknown
134 | - [Description] Potential exposure of WiFi WEP keys.
135 | - [Details] Script includes logic for preparing WEP keys, which are inherently insecure.
136 | - [Impact] Exposure of sensitive key material if improperly handled.
137 | - [Risk Level] Medium
138 | 
139 | - [Location] sbin/hotplug-call
140 | - [Type] Component
141 | - [Version Info] Unknown
142 | - [Description] Exposure of privileged environment variables.
143 | - [Details] Script exports USER=root and LOGNAME=root, posing a risk of privilege misuse.
144 | - [Impact] Privilege escalation or misuse during execution of external scripts.
145 | - [Risk Level] Medium
146 | 
147 | - [Location] sbin/hotplug-call
148 | - [Type] Component
149 | - [Version Info] Unknown
150 | - [Description] Execution of unvalidated scripts from /etc/hotplug.d/$1.
151 | - [Details] Script sources all scripts in the directory without integrity or permission checks.
152 | - [Impact] Remote code execution if an attacker places a malicious script in the directory.
153 | - [Risk Level] Critical
154 | '''
155 | 


--------------------------------------------------------------------------------
/firmanalyzer/Examples/openwrt/openwrtSample/summary.txt:
--------------------------------------------------------------------------------
 1 | '''
 2 | Firmware Summary:
 3 | [Basic Info]
 4 | - Name/Version: Firmware version 1.28.4 (BusyBox)
 5 | - Device/Type/Arch: Generic embedded device, SquashFS file system
 6 | - Key Info: Kernel version/release date unknown; firmware created on 2019-06-27.
 7 | 
 8 | [Coverage] 
 9 | - Key Dirs: /bin, /sbin, /www/luci-static/resources
10 | - Key Files: /bin/busybox, /bin/opkg, /bin/uclient-fetch, /bin/config_generate, /sbin/init, /sbin/mtd, /sbin/netifd, /sbin/rpcd, /sbin/uci, /sbin/wifi, /sbin/hotplug-call
11 | 
12 | [Main Issues]
13 | - Critical Issues:
14 |   - /bin/busybox: Multiple use-after-free vulnerabilities in the awk applet (CVE-2021-42381, CVE-2021-42380, CVE-2021-42379, CVE-2021-42378, CVE-2021-42377) allow remote code execution.
15 |   - /bin/opkg: Format string vulnerabilities in sym.remove_maintainer_scripts and sym.pkg_dest_init due to lack of input validation via sym_sprintf_alloc and sprintf_alloc misuse.
16 |   - /bin/uclient-fetch: Function pointer execution without validation (sym.imp.getenv) and unvalidated memcpy parameters (via sym.imp.uclient_set_proxy_url) risk memory corruption and remote code execution.
17 |   - /sbin/init: Improper handling of sensitive operations in fcn.004019d4, including command injection risks via unsanitized inputs to '/bin/sh' and '/etc/preinit'.
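18 |   - /sbin/mtd: Unconditional jump to insecure system call at 0x400f84 and dynamic invocation of sym.imp.sscanf without identifiable static callers, risking remote code execution. Version 2.0 was additionally matched to CVE-2016-9092, a CSRF issue in the Mail Threat Defense (MTD) management console.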
19 |   - /sbin/netifd: Format string vulnerability in fprintf (0x402854), unvalidated recv input (0x402894 via nl_recvmsgs), and memcpy with attacker-controlled parameters (0x4025c4) expose the binary to arbitrary code execution and buffer overflows. OpenWrt versions prior to 19.07.7 are additionally affected by CVE-2021-22161, an IPv6 routing loop leading to excessive network traffic.
20 |   - /sbin/rpcd: Format string vulnerabilities and insecure use of asprintf/sprintf (e.g., 0x402208, 0x401f58) propagate user-controlled inputs without sanitization, allowing potential remote code execution or buffer overflow attacks.
21 |   - /sbin/uci: Insecure use of sscanf (0x400f30) without input validation exposes the binary to buffer overflow or format string vulnerabilities. Known vulnerability CVE-2017-17867 allows authenticated users to execute arbitrary OS commands via the leasetrigger field.
22 |   - /sbin/hotplug-call: Dynamic execution of scripts in /etc/hotplug.d/$1 without integrity checks allows arbitrary code execution if an attacker places a malicious script in the directory.
23 | 
24 | - Major Issues:
25 |   - /sbin/wifi: Exposure of WEP keys due to outdated protocol usage and improper key handling logic increases the risk of credential compromise.
26 |   - /sbin/hotplug-call: Exporting privileged environment variables (USER=root, LOGNAME=root) during execution poses a privilege escalation risk if misused by external scripts.
27 |   - /bin/uclient-fetch: Embedded HTTP authentication password parameter (--password=<password>) risks accidental credential exposure if misused or logged.
28 |   - /sbin/init: Potential insecure use of 'chroot' functionality with error messages indicating improper implementation, risking privilege escalation.
29 |   - /sbin/logread: Sensitive operational flags or parameters (e.g., 'u0fcs:l:r:F:p:S:P:h:e:t') may expose configuration details if misused.
30 |   - /bin/config_generate: Default IP configurations (e.g., 192.168.1.1), hardcoded NTP servers ('0.openwrt.pool.ntp.org'), and generic hostname ('OpenWrt') could expose the device to fingerprinting or exploitation if not modified during deployment.
31 | 
32 | - Other Issues:
33 |   - /bin/config_generate: Hardcoded default PPPoE credentials ('username'/'password') and a default password ('password') for network configurations pose significant risks of unauthorized access if unchanged.
34 |   - /sbin/init: Presence of 'init_debug' and '/tmp/debug_level' may expose sensitive debug information if improperly secured.
35 |   - /sbin/rpcd: Keywords like 'password' and 'keys' suggest potential presence of hardcoded credentials or cryptographic keys, posing a security risk if improperly managed.
36 | 
37 | [Attack Surface]
38 | - Attack Points: Vulnerabilities in /bin/busybox, /bin/opkg, /bin/uclient-fetch, /sbin/init, /sbin/mtd, /sbin/netifd, /sbin/rpcd, /sbin/uci, /sbin/logread, /bin/config_generate, /sbin/wifi, and /sbin/hotplug-call expose the system to remote code execution, command injection, memory corruption, privilege escalation, and unauthorized access attacks via malicious inputs, environment manipulation, or default credential exploitation.
39 | '''
40 | 


--------------------------------------------------------------------------------
/firmanalyzer/Examples/summary_example.md:
--------------------------------------------------------------------------------
 1 | # 🔍 OpenWrt Firmware Security Analysis
 2 | > Comprehensive security assessment of OpenWrt Linux-4.19.69 MIPS32 firmware
 3 | 
 4 | ## Executive Summary
 5 | 
 6 | | Category | Details |
 7 | |----------|---------|
 8 | | **Firmware** | OpenWrt Linux-4.19.69 |
 9 | | **Architecture** | MIPS32 |
10 | | **Release Date** | 2019-09-05 |
11 | 
12 | ## Critical Security Vulnerabilities
13 | 
14 | ### System Components
15 | | Component | Version | Key Vulnerabilities |
16 | |-----------|---------|-------------------|
17 | | BusyBox | 1.31.0 | CVE-2022-48174, CVE-2022-30065, CVE-2022-28391 |
18 | | GLIBC | 2.0 | CVE-2022-23218, CVE-2021-3999, CVE-2015-0235 |
19 | | dnsmasq | < 2.83 | CVE-2020-25684, CVE-2020-25683, CVE-2020-25682 |
20 | | hostapd/wpa_supplicant | 2.7 | CVE-2019-9494 through CVE-2019-9499 |
21 | 
22 | ### Authentication & Access Control
23 | - Empty root password hash in `/etc/shadow`
24 | - Hardcoded network passwords
25 | - Clear-text password exposure in `uclient-fetch`
26 | - Insecure `/etc/passwd` and `/etc/shadow` manipulation
27 | 
28 | ### Network Security
29 | - DNS cache poisoning vulnerabilities
30 | - MITM package injection risk (CVE-2020-7982)
31 | - Insecure firmware upgrade process
32 | - Multiple WPA authentication bypass vectors
33 | 
34 | ### Kernel Module Vulnerabilities
35 | | Module | Vulnerabilities |
36 | |--------|----------------|
37 | | ip_tables.ko | Buffer overflow, RCE risks |
38 | | nf_nat.ko | Stack corruption, kernel execution |
39 | | mac80211.ko | CVE-2014-8709, CVE-2014-2706 |
40 | | usbcore.ko | Spectre vulnerability (CVE-2019-15902) |
41 | 
42 | 
43 | 
44 | 


--------------------------------------------------------------------------------
/firmanalyzer/Examples/tp-link/TL-IPC55x_P_-x_2.0/summary.txt:
--------------------------------------------------------------------------------
 1 | '''
 2 | Firmware Summary:
 3 | [Basic Info]
 4 | - Name/Version: TL-IPC55x_P_-x_2.0
 5 | - Device/Type/Arch: TP-Link IPC55x, ARM architecture
 6 | - Key Info: Kernel version 3.4.35, Squashfs filesystem, Build date 2017-04-20
 7 | 
 8 | [Coverage] 
 9 | - Key Dirs: /bin, /etc, /sbin, /usr/bin, /lib
10 | - Key Files: bin/busybox, bin/ipcd, bin/cloud-client, bin/dn_switch, bin/ubus, bin/opkg, bin/login.sh, bin/onvif, bin/tddpd, bin/vda, bin/wtd, sbin/netifd, sbin/ubusd, sbin/checkipconflict, sbin/uci, sbin/sysupgrade, sbin/luci-reload, sbin/wget2nand, sbin/wifi, sbin/hotplug2, sbin/mount_root, etc/opkg.conf, etc/passwd, etc/shadow, etc/diag.sh, etc/group, etc/relayd.conf, etc/sysctl.conf, etc/hk_proto_config, etc/banner, etc/openwrt_release, etc/openwrt_version, etc/profile, etc/protocols, etc/services, etc/usr_conf_data, etc/tddpd/priv-key.pem, lib/ld-uClibc.so.0, lib/libcyassl.so, lib/libcyassl.so.5, lib/libcrypt.so.0, lib/libevent-2.0.so.5, lib/libpng12.so.0, lib/libqrencode.so, lib/libuci.so, lib/libpthread-0.9.32.1.so, lib/libpthread.so.0, lib/TL-IPC555V2-6.ini, lib/functions.sh, lib/libresolv-0.9.32.1.so, lib/libutil-0.9.32.1.so, lib/libc.so.0, lib/libdl.so.0, lib/libm.so.0, lib/libthread_db-0.9.32.1.so, lib/librt-0.9.32.1.so, lib/librt.so.0, lib/TL-IPC553V2-4.ini, lib/TL-IPC553V2-6.ini, lib/TL-IPC553V2-8.ini, lib/TL-IPC555V2-8.ini, lib/libdecrypter.so, lib/libmsglog.so, lib/libblobmsg_json.so, lib/libubus.so
11 | 
12 | [Main Issues]
13 | - Critical Issues:
14 |   - /etc/init.d/cfgdev_info: Lack of input validation for DEV_NAME and HW_VER allows command injection via untrusted inputs from 'tddpServer'; hardcoded UUID (8857c040-49cb-4e6e-b0cd-2148cf3e07c2) exposes sensitive device identification data.
15 |   - /etc/init.d/uhttpd: Potential exposure of SSL/TLS private key (/etc/uhttpd.key) and certificate (/etc/uhttpd.crt) due to improper file permissions; risks unauthorized decryption of sensitive data.
16 |   - /lib/libubus.so: Format string vulnerability in sym.ubus_strerror and buffer overflow risks in fcn.00001534 and fcn.0000333c from unchecked memcpy; use-after-free potential in sym.ubus_complete_request (GCC 4.8.3, CVE-2018-12886).
17 |   - /lib/libdecrypter.so: RSA private key handling functions expose sensitive cryptographic operations.
18 |   - /lib/libmsglog.so: Known GCC 4.8.3 vulnerabilities (CVE-2018-12886, CVE-2017-11671, CVE-2015-5276) enable stack protector bypass and buffer overflow risks.
19 |   - /lib/libblobmsg_json.so: Lack of input validation and insecure function usage (e.g., sprintf, memcpy) enables buffer overflow risks leading to RCE.
20 |   - /lib/librt.so.0: Unchecked memcpy in sym.mq_notify and recv call allows up to 0x20 bytes without length validation, enabling potential RCE.
21 |   - /lib/libc.so.0: Buffer overflow in sym.__uClibc_main due to unchecked memcpy, allowing potential RCE.
22 |   - /lib/libresolv-0.9.32.1.so: Multiple DNS-related vulnerabilities (CVE-2022-30295, CVE-2022-29503, CVE-2021-43523, CVE-2017-9729, CVE-2017-9728).
23 |   - /lib/libutil-0.9.32.1.so: Buffer overflow in sym.openpty due to unchecked strcpy, enabling potential RCE.
24 |   - /lib/libpthread.so.0: Multiple vulnerabilities (CVE-2022-30295, CVE-2021-43523, CVE-2017-9729, CVE-2017-9728, CVE-2016-6264) enabling DNS cache poisoning and stack exhaustion.
25 |   - /lib/libpng12.so.0: Buffer overflow vulnerabilities (e.g., CVE-2016-10087) in outdated libpng 1.2.56.
26 |   - /lib/libuci.so: Use-after-free vulnerability (CVE-2020-28951) and insecure strcpy usage enabling buffer overflow attacks.
27 |   - /lib/libcrypt.so.0: Buffer overflow due to misuse of memcpy without bounds checking.
28 |   - /lib/libevent-2.0.so.5: Integer overflows (CVE-2015-6525, CVE-2014-6272) enabling heap-based buffer overflows or infinite loops.
29 |   - /lib/ld-uClibc.so.0: Format string vulnerability in sym._dl_map_cache allowing potential RCE.
30 |   - /lib/libcyassl.so: Multiple memcpy calls without bounds checking leading to buffer overflow vulnerabilities.
31 |   - /lib/libdl.so.0: Multiple vulnerabilities (CVE-2022-29503, CVE-2017-9729, CVE-2017-9728) enabling memory corruption and out-of-bounds reads.
32 |   - /lib/libm.so.0: Critical vulnerabilities (CVE-2013-7039, CVE-2013-7038) enabling potential RCE and information disclosure.
33 |   - /sbin/hotplug2: Lack of stack canaries, ASLR, and NX bit enforcement; unsanitized system() call enables arbitrary command execution.
34 |   - /sbin/wget2nand: Unsanitized URL parameter allowing SSRF or unauthorized server access.
35 |   - /bin/busybox: Outdated BusyBox 1.19.4 with known RCE and buffer overflow vulnerabilities.
36 |   - /bin/vda: Directory traversal, stack overflow, use-after-free, and format string flaws enabling arbitrary code execution.
37 |   - /bin/tddpd: Private key exposure at /etc/tddpd/priv-key.pem with world-readable permissions.
38 |   - /bin/ipcd: Buffer overflow and command injection due to strcpy/system misuse.
39 |   - /bin/onvif: gSOAP library vulnerabilities enabling RCE and stack-based buffer overflow.
40 |   - /sbin/ubusd: Buffer overflow enabling arbitrary memory corruption and RCE.
41 |   - /sbin/sysupgrade: Insecure firmware update process allowing malicious code injection.
42 |   - /etc/passwd: Weak password hashing algorithm detected (MD5), making hashes susceptible to brute-force attacks.
43 |   - /etc/init.d/cfgmac: Hardcoded default MAC address (A8:57:4E:FD:93:5E) poses spoofing risks; reliance on ubus calls to 'tddpServer' introduces potential attack vector for unauthorized access.
44 | 
45 | - Major Issues:
46 |   - /etc/init.d/cloud_client: Dynamic URLs (`download_url`, `release_log_url`) lack validation, risking injection; use of md5sum for checksum verification is insecure and vulnerable to hash collision attacks.
47 |   - /etc/init.d/boot: Default hostname ('SLP') and timezone ('UTC') values embedded; 'killall' used without strict parameter validation, risking unintended process termination.
48 |   - /etc/init.d/netlinkd: Version information exposure ("2008-2011 OpenWrt.org") aiding attackers in identifying potential vulnerabilities.
49 |   - /etc/init.d/ddns: Version information exposure ("2008-2012 OpenWrt.org") aiding attackers in identifying potential vulnerabilities; insecure default configuration uses 'eth0' as WAN interface.
50 |   - /etc/init.d/firewall: Outdated script (copyright 2008-2010) potentially containing known vulnerabilities; invokes `/sbin/fw` without security context validation.
51 |   - /etc/relayd.conf: Potential insecure network relay settings exposed via endpoint 'relay-ipc.tplinkcloud.com.cn:80', indicating possible internal network exposure.
52 |   - /etc/sysctl.conf: IPv6 forwarding globally enabled ('net.ipv6.conf.all.forwarding=1') and bridge firewalling enabled ('net.bridge.bridge-nf-call-iptables=1'), increasing attack surface unnecessarily.
53 |   - /etc/opkg.conf: Version information exposure in URL and insecure repository configuration using HTTP, enabling man-in-the-middle attacks and tampering with downloaded packages.
54 |   - /sbin/wifi: Weak WEP encryption logic exposing device to known vulnerabilities.
55 |   - /etc/rc.common: Version info exposure ('Copyright (C) 2006-2012 OpenWrt.org') aiding attackers in targeting known vulnerabilities associated with specific versions.
56 |   - /etc/group: Excessive group permissions potentially enabling privilege escalation.
57 |   - /etc/init.d/miniupnpd: Version information exposure ('2006-2011') aiding attackers in identifying potentially vulnerable components.
58 |   - /etc/init.d/sysctl: Setting 'net.core.dev_weight=0' could cause system instability by triggering unintended behavior in the NAPI poll function (CVE-2025-21806), leading to denial of service.
59 | 
60 | - Other Issues:
61 |   - /bin/cloud-client: Hardcoded token exposing cloud service credentials.
62 |   - /etc/shadow: User account structure revealed, aiding targeted attacks despite no direct sensitive data exposure.
63 | '''
64 | 
65 | 


--------------------------------------------------------------------------------
/firmanalyzer/Examples/ui/Ubiquiti 4.3.22.11330/report.txt:
--------------------------------------------------------------------------------
  1 | '''
  2 | - [Location] etc/activate_tunnel.sh
  3 | - [Type] Component
  4 | - [Version Info] Unknown
  5 | - [Description] Script lacks input validation and sanitization for critical commands.
  6 | - [Details] The script dynamically retrieves network parameters and uses variables like $cfg, $cmd, $dev, and $remote without proper sanitization in commands such as `ip link` and `ip l2tp`, which could lead to command injection vulnerabilities.
  7 | - [Impact] Potential arbitrary command execution with script privileges.
  8 | - [Risk Level] High
  9 | 
 10 | - [Location] etc/common.sh
 11 | - [Type] Component
 12 | - [Version Info] Version referenced via "/lib/version"
 13 | - [Description] Exposure of version details and insecure handling of sensitive data in ramdisk.
 14 | - [Details] The script mounts a ramdisk and switches the root filesystem using `pivot_root`. It copies files like `/usr/etc/common.sh`, `/lib/version`, and `/bin/busybox` into the ramdisk, potentially exposing sensitive data if compromised.
 15 | - [Impact] Attackers may exploit known vulnerabilities associated with exposed versions or extract sensitive information from the ramdisk.
 16 | - [Risk Level] Medium
 17 | 
 18 | - [Location] etc/default_ar9344.cfg
 19 | - [Type] Credential/Configuration
 20 | - [Version Info] Unknown
 21 | - [Description] Exposure of plaintext passwords and default Wi-Fi PSK.
 22 | - [Details] Contains users.1.password=VvpvCwhccFv6Q and aaa.1.wpa.psk=DEFAULTPASSWORD, exposing credentials and pre-shared keys.
 23 | - [Impact] Unauthorized access to user accounts and Wi-Fi networks.
 24 | - [Risk Level] Critical
 25 | 
 26 | - [Location] etc/default_bcm5334x.cfg
 27 | - [Type] Credential
 28 | - [Version Info] Unknown
 29 | - [Description] Presence of plaintext password in configuration file.
 30 | - [Details] Contains users.1.password=VvpvCwhccFv6Q, exposing a plaintext password.
 31 | - [Impact] Unauthorized access to user accounts if the file is accessed by attackers.
 32 | - [Risk Level] High
 33 | 
 34 | - [Location] etc/default_nossid.cfg
 35 | - [Type] Credential/Configuration
 36 | - [Version Info] Unknown
 37 | - [Description] Exposure of plaintext password and use of default settings.
 38 | - [Details] Contains users.1.password=VvpvCwhccFv6Q and mgmt.is_default=true, indicating default configurations and exposed credentials.
 39 | - [Impact] Increased attack surface due to default settings and potential unauthorized access.
 40 | - [Risk Level] High
 41 | 
 42 | - [Location] etc/default_qca956x.cfg
 43 | - [Type] Credential/Configuration
 44 | - [Version Info] Unknown
 45 | - [Description] Default credentials and WPA PSK exposure, along with bridged network risks.
 46 | - [Details] Contains users.1.name=ubnt, users.1.password=VvpvCwhccFv6Q, aaa.1.wpa.psk=DEFAULTPASSWORD, and bridge.1.devname=br0, exposing sensitive data and internal devices.
 47 | - [Impact] Unauthorized access to user accounts, Wi-Fi networks, and internal devices.
 48 | - [Risk Level] Critical
 49 | 
 50 | - [Location] etc/.version
 51 | - [Type] Other
 52 | - [Version Info] 4.3.22
 53 | - [Description] Exposure of firmware version information.
 54 | - [Details] File contains "4.3.22", exposing specific firmware version details.
 55 | - [Impact] Attackers may exploit known vulnerabilities associated with this version.
 56 | - [Risk Level] Medium
 57 | 
 58 | - [Location] etc/hotplug2.rules
 59 | - [Type] Configuration
 60 | - [Version Info] Unknown
 61 | - [Description] Improper device handling with insecure permissions.
 62 | - [Details] Rules expose devices (e.g., /dev/%DEVICENAME%) with mode 0666, allowing unauthorized access.
 63 | - [Impact] Unauthorized access to critical device files.
 64 | - [Risk Level] Medium
 65 | 
 66 | - [Location] etc/profile
 67 | - [Type] Other
 68 | - [Version Info] Unknown
 69 | - [Description] Exposure of version details through `/etc/version`.
 70 | - [Details] File references `/etc/version`, potentially exposing system or software version information.
 71 | - [Impact] Attackers may identify and exploit vulnerabilities associated with the exposed version.
 72 | - [Risk Level] Low
 73 | 
 74 | - [Location] etc/protocols
 75 | - [Type] Other
 76 | - [Version Info] IPv6 and related components
 77 | - [Description] Exposure of version identifiers for protocols.
 78 | - [Details] File mentions IPv6 and related components with version identifiers.
 79 | - [Impact] Attackers may target specific versions with known vulnerabilities.
 80 | - [Risk Level] Medium
 81 | 
 82 | - [Location] etc/services
 83 | - [Type] Other
 84 | - [Version Info] Multiple services (e.g., Kerberos v5, POP version 2/3, IMAP version 2)
 85 | - [Description] Exposure of service versions and unnecessary network service ports.
 86 | - [Details] References to specific versions of services and ports like 'kpasswd' on port 761/tcp. CVEs (e.g., CVE-2018-5710, CVE-2012-1015) affect MIT Kerberos 5.
 87 | - [Impact] Potential denial of service, remote code execution, or exploitation of outdated protocols.
 88 | - [Risk Level] High
 89 | '''
 90 | '''
 91 | - [Location] etc/passwd
 92 | - [Type] Credential
 93 | - [Version Info] Unknown
 94 | - [Description] Password hash exposure for the 'ubnt' user.
 95 | - [Details] The file contains a password hash ('VvpvCwhccFv6Q') for the 'ubnt' user.
 96 | - [Impact] Exposure of password hashes can lead to offline brute-force attacks.
 97 | - [Risk Level] Medium
 98 | 
 99 | - [Location] etc/default-ec20.cfg
100 | - [Type] Configuration
101 | - [Version Info] Unknown
102 | - [Description] Default password and insecure wireless settings.
103 | - [Details] Default password (users.1.password=VvpvCwhccFv6Q), unencrypted wireless networks (wireless.1.security=none, wireless.2.security=none), and exposed version info via mgmt.flavor=ace.
104 | - [Impact] Potential unauthorized access and network exploitation.
105 | - [Risk Level] High
106 | 
107 | - [Location] etc/default_nossid_qca956x.cfg
108 | - [Type] Configuration
109 | - [Version Info] Unknown
110 | - [Description] Plaintext password and insecure wireless settings.
111 | - [Details] Plaintext password (users.1.password=VvpvCwhccFv6Q), wireless security disabled (wireless.1.security=none), hidden SSID (wireless.1.hide_ssid=true), and internal syslog server IP (syslog.remote.ip=192.168.1.1).
112 | - [Impact] Unauthorized system access and increased risk of network compromise.
113 | - [Risk Level] Critical
114 | 
115 | - [Location] etc/system.cfg
116 | - [Type] Configuration
117 | - [Version Info] Unknown
118 | - [Description] Plaintext password exposure for the user 'ubnt'.
119 | - [Details] Plaintext password (users.1.password=VvpvCwhccFv6Q) for the user 'ubnt'.
120 | - [Impact] Significant security risk if firmware is compromised.
121 | - [Risk Level] High
122 | 
123 | - [Location] etc/syswrapper.sh
124 | - [Type] Component
125 | - [Version Info] Unknown
126 | - [Description] Multiple security vulnerabilities including predictable lockfile paths, use of weak hashing algorithms, insecure handling of tokens, and command injection risks.
127 | - [Details] Predictable lockfile paths (/var/run/fwupdate.pid, /var/run/led.lock), weak hashing (MD5), plaintext token storage (/var/run/stream.token), use of `eval` without input validation, and insecure use of curl for firmware downloads.
128 | - [Impact] Privilege escalation, information disclosure, and potential remote code execution.
129 | - [Risk Level] Critical
130 | 
131 | - [Location] etc/ethertypes
132 | - [Type] Other
133 | - [Version Info] IPv4, IPv6
134 | - [Description] Exposure of IP version information.
135 | - [Details] Explicit mentions of IP versions (IPv4 and IPv6).
136 | - [Impact] Possible identification of protocol-specific vulnerabilities.
137 | - [Risk Level] Low
138 | '''
139 | '''
140 | - [Location] etc/rc.d/rc
141 | - [Type] Configuration
142 | - [Version Info] Unknown
143 | - [Description] Potential SSH key and certificate setup issue detected.
144 | - [Details] The script references 'rc.identity' for setting up certificates and SSH keys. It dynamically generates SSH keys if they are not present and creates symbolic links for web server certificates ('server.crt', 'server.key'). However, it does not enforce strong permissions or verify the integrity of these files.
145 | - [Impact] Improper handling could lead to unauthorized access due to weak file permissions or exposure of sensitive cryptographic material.
146 | - [Risk Level] Medium
147 | 
148 | - [Location] etc/rc.d/rc.btusb
149 | - [Type] Configuration
150 | - [Version Info] Unknown
151 | - [Description] Potential insecure handling of Bluetooth MAC address (bdaddr).
152 | - [Details] The script retrieves and processes a Bluetooth MAC address from '/proc/ubnthal/system.info' without validating its source or integrity.
153 | - [Impact] If an attacker manipulates this value, it could lead to unauthorized Bluetooth device impersonation or misconfiguration.
154 | - [Risk Level] Medium
155 | 
156 | - [Location] etc/rc.d/rc.identity
157 | - [Type] Credential
158 | - [Version Info] Unknown
159 | - [Description] Potential exposure of sensitive cryptographic material.
160 | - [Details] The script handles SSH keys (RSA and DSS) and web server certificates. It checks for pre-existing keys but generates new ones using dropbearkey if none are found. Permissions or storage locations are not explicitly secured.
161 | - [Impact] This could lead to unintended exposure of private keys if permissions or storage locations are improperly secured.
162 | - [Risk Level] High
163 | '''
164 | '''
165 | - [Location] etc/udhcpc/udhcpc
166 | - [Type] Component
167 | - [Version Info] BusyBox udhcpc version 1.20, CVE-2016-2148, CVE-2016-2147
168 | - [Description] The identified version of udhcpc is vulnerable to two critical vulnerabilities: CVE-2016-2148 (Heap-based buffer overflow) and CVE-2016-2147 (Integer overflow).
169 | - [Details] Both vulnerabilities affect versions of BusyBox udhcpc prior to 1.25.0. These issues could allow remote attackers to cause a denial of service or potentially execute arbitrary code.
170 | - [Impact] Remote code execution or denial of service by exploiting heap-based buffer overflow or integer overflow vulnerabilities.
171 | - [Risk Level] Critical
172 | 
173 | - [Location] etc/udhcpc/udhcpc_ip_only
174 | - [Type] Component
175 | - [Version Info] BusyBox udhcpc version unknown, CVE-2016-2148, CVE-2016-2147, CVE-2011-2716
176 | - [Description] Multiple vulnerabilities detected in the script including CVE-2016-2148 (Heap-based buffer overflow), CVE-2016-2147 (Integer overflow), and CVE-2011-2716 (Command injection via DHCP options). 
177 | - [Details] The script uses 'eval' to process configuration data dynamically without visible input sanitization. Specifically, the line `eval \`grep dhcpc\. $CFG_FILE | /bin/sed ...` processes data from '/tmp/system.cfg' or '/tmp/running.cfg', making it vulnerable to command injection if an attacker controls these files.
178 | - [Impact] Potential for remote code execution, denial of service, or command injection due to improper handling of dynamic input.
179 | - [Risk Level] Critical
180 | '''
181 | 


--------------------------------------------------------------------------------
/firmanalyzer/Examples/ui/Ubiquiti 4.3.22.11330/summary.txt:
--------------------------------------------------------------------------------
 1 | '''
 2 | Firmware Summary:
 3 | [Basic Info]
 4 | - Name/Version: Ubiquiti 4.3.22.11330
 5 | - Device/Type/Arch: Ubiquiti device, ARM architecture
 6 | - Key Info: Linux kernel version 3.6.5, released on 2020-11-03
 7 | 
 8 | [Coverage] 
 9 | - Key Dirs: /usr/etc, /usr/www, /lib, /bin, /etc, /etc/rc.d, /etc/udhcpc
10 | - Key Files: /usr/etc/activate_tunnel.sh, /usr/etc/common.sh, /usr/etc/default_ar9344.cfg, /usr/etc/passwd, /etc/default_bcm5334x.cfg, /etc/default_nossid.cfg, /etc/.version, /etc/hotplug2.rules, /etc/profile, /etc/protocols, /etc/services, /etc/default-ec20.cfg, /etc/default_nossid_qca956x.cfg, /etc/system.cfg, /etc/syswrapper.sh, /etc/ethertypes, /etc/rc.d/rc, /etc/rc.d/rc.btusb, /etc/rc.d/rc.identity, /etc/udhcpc/udhcpc, /etc/udhcpc/udhcpc_ip_only
11 | 
12 | [Main Issues]
13 | - Critical Issues:
14 |   - /etc/system.cfg: Exposure of plaintext password for the user 'ubnt' (users.1.password=VvpvCwhccFv6Q), risking unauthorized access.
15 |   - /etc/syswrapper.sh: Use of `eval` with unsanitized inputs in functions like `check_vap_status` and `run`, allowing command injection vulnerabilities that could lead to remote code execution or privilege escalation.
16 |   - /etc/syswrapper.sh: Predictable lockfile paths (/var/run/fwupdate.pid, /var/run/led.lock) and insecure handling of sensitive keys/tokens (e.g., /var/run/stream.token) create risks of symlink attacks and unauthorized access.
17 |   - /usr/etc/activate_tunnel.sh: Lack of input sanitization for variables like $dev and $remote used in critical commands (`ip link`, `ip l2tp`), potentially allowing command injection vulnerabilities.
18 |   - /etc/hotplug2.rules: Improper device handling with insecure permissions (e.g., /dev/%DEVICENAME% with mode 0666), enabling unauthorized access to critical device files.
19 |   - /etc/rc.d/rc.identity: Insecure handling of SSH keys and web server certificates, including lack of enforced strong permissions or integrity checks, potentially exposing private keys and sensitive cryptographic material.
20 |   - /etc/udhcpc/udhcpc, /etc/udhcpc/udhcpc_ip_only: Multiple CVEs detected (CVE-2016-2148, CVE-2016-2147, CVE-2011-2716), exposing risks such as heap-based buffer overflow, integer overflow, and command injection via DHCP options, leading to remote code execution or denial of service.
21 | 
22 | - Major Issues:
23 |   - /etc/syswrapper.sh: Exposure of versioning details through variables like FW_MD5SUMFILE and /var/run/fwversion.next, increasing the risk of targeted attacks based on known vulnerabilities.
24 |   - /usr/etc/common.sh, /etc/.version, /etc/profile, /etc/protocols, /etc/default-ec20.cfg: Exposure of version information via `/lib/version`, `/etc/.version`, `/etc/profile`, `/etc/protocols`, and `mgmt.flavor=ace`, enabling attackers to exploit known vulnerabilities associated with this firmware version.
25 |   - /etc/default_nossid.cfg, /etc/default_qca956x.cfg, /etc/default-ec20.cfg, /etc/default_nossid_qca956x.cfg: Default settings (mgmt.is_default=true), bridged network configurations (bridge.1.devname=br0), and unencrypted wireless networks (wireless.1.security=none) increase attack surface by exposing internal devices and relying on insecure defaults.
26 |   - /etc/services: Presence of outdated or insecure protocols (e.g., Kerberos v4) and references to specific service versions (e.g., Kerberos v5) exposing the system to known vulnerabilities such as CVE-2018-5710, CVE-2018-5709, and CVE-2012-1015.
27 |   - /etc/rc.d/rc.btusb: Insecure handling of Bluetooth MAC address (bdaddr) from '/proc/ubnthal/system.info' without source validation, risking Bluetooth device impersonation or misconfiguration.
28 |   - /etc/udhcpc/udhcpc, /etc/udhcpc/udhcpc_ip_only: Use of `eval` with unsanitized input from configuration files ('/tmp/system.cfg', '/tmp/running.cfg'), creating a command injection vulnerability that could allow arbitrary command execution.
29 | 
30 | - Other Issues:
31 |   - /etc/ethertypes: Exposure of IP version information (IPv4, IPv6), which could assist attackers in identifying protocol-specific vulnerabilities.
32 |   - /etc/default_nossid_qca956x.cfg: Presence of specific IP addresses (e.g., 192.168.1.20, 192.168.1.1) indicating sensitive network configurations and potential internal infrastructure exposure.
33 |   - /etc/rc.d/rc: Potential SSH key setup detected with improper configuration risks due to sourcing 'rc.identity', which may expose sensitive data if not securely handled.
34 | '''
35 | 


--------------------------------------------------------------------------------
/firmanalyzer/Examples/ui/Ubiquiti Linux-2.6.32.71/summary:
--------------------------------------------------------------------------------
 1 | '''
 2 | Firmware Summary:
 3 | [Basic Info]
 4 | - Name/Version: Ubiquiti Linux-2.6.32.71
 5 | - Device/Type/Arch: MIPS32
 6 | - Key Info: Kernel version 2.6.32.71, created 2018-05-23
 7 | 
 8 | [Coverage] 
 9 | - Key Dirs: /usr/etc, /usr/www, /bin, /lib, /lib/ebtables, /lib/iptables, /lib/network, /lib/firmware, /lib/modules, /lib/wifi, /lib/ddns, /lib/firewall, /lib/pppd, /lib/tinysnmp, /lib/ubnt, /usr/etc/ppp, /usr/etc/udhcpc, /usr/etc/usb_modeswitch.d, /usr/etc/rc.d
10 | - Key Files: /usr/etc/server.key, /usr/etc/system.cfg, /usr/etc/services, bin/busybox, bin/lighttpd, bin/dropbear, lib/libcrypto.so.1.0.0, lib/libssl.so.1.0.0, lib/libuClibc-0.9.29.so, lib/libpcap.so.1, lib/libssh2.so.1.0.1, lib/libwebsockets.so.10, lib/libjson-c.so.2.0.1, lib/libevent-2.1.so.6.0.2, lib/libusb-0.1.so.4.4.4, lib/ebtables/libebt_ip.so, lib/ebtables/libebt_nat.so, lib/firewall/uci_firewall.sh, lib/ddns/dynamic_dns_functions.sh, lib/ddns/dynamic_dns_updater.sh, lib/tinysnmp/interfaces.so, lib/tinysnmp/ubnt.so, lib/tinysnmp/ieee802dot11.so, lib/tinysnmp/resources.so, lib/ubnt/cl_functions.sh, lib/wifi/hostapd.sh, lib/wifi/wpa_supplicant.sh, lib/pppd/2.4.4/rp-pppoe.so, /usr/www/sshd-authkeys.cgi, /usr/www/fwflash.cgi, /usr/www/ubnt.cgi, /usr/www/network.cgi, /usr/www/status.cgi, /usr/www/ubnt.net.js, /usr/www/system.cgi, /usr/www/services.cgi, /usr/www/getboardinfo.sh, /usr/etc/lighttpd/clighttpd.conf, /usr/etc/rc.d/rc.sysinit, /usr/etc/rc.d/rc.softrestart
11 | 
12 | [Security Issues]
13 | - Critical Issues: 
14 |   - /usr/etc/server.key: Hardcoded private key found in firmware, not protected by passphrase, exposing encrypted communications to compromise
15 |   - /usr/etc/system.cfg: Exposed password hash for user 'ubnt' ($1$tL963iDU$SXu0h02ZZYfnoZcPkIlK21) with SSH enabled on port 22, risking unauthorized access
16 |   - /usr/www/fwflash.cgi: Hardcoded token-based authentication and lack of input validation for $do_update variable, risking unauthorized firmware updates
17 |   - /usr/www/status.cgi: Multiple critical vulnerabilities including buffer overflow risks due to unsafe 'gets' function usage, lack of input validation, and potential for arbitrary code execution
18 |   - /usr/www/system.cgi: Insecure password handling using crypt() for hashing, potentially insecure token-based authentication, and weak password policy with default credentials ('ubnt' and 'guest')
19 |   - /usr/www/services.cgi: Insecure handling of sensitive credentials (dyndns.1.password, https_cert_key_file) stored in plaintext, potential command injection via 'exec' function
20 |   - bin/busybox: Outdated BusyBox v1.24.2 with multiple critical CVEs (CVE-2022-48174, CVE-2022-30065, CVE-2021-42386)
21 |   - bin/lighttpd: Outdated OpenSSL 1.0.0 with critical vulnerabilities (CVE-2014-0160, CVE-2014-0224, CVE-2014-0195)
22 |   - bin/dropbear: Outdated Dropbear SSH version 2016.74 with potential unpatched vulnerabilities
23 |   - lib/libcrypto.so.1.0.0: Outdated OpenSSL 1.0.2m with multiple critical CVEs (CVE-2017-3738, CVE-2017-3737, CVE-2017-3736, CVE-2017-3735)
24 |   - lib/libssl.so.1.0.0: Outdated OpenSSL 1.0.2m with multiple critical CVEs (CVE-2017-3738, CVE-2017-3737, CVE-2017-3736, CVE-2017-3735)
25 |   - lib/libuClibc-0.9.29.so: Outdated uClibc version 0.9.29 with critical vulnerabilities (CVE-2022-30295, CVE-2022-29503, CVE-2017-9729, CVE-2017-9728)
26 |   - lib/libpcap.so.1: Outdated libpcap version 1.8.1 with multiple critical CVEs (CVE-2019-15165, CVE-2019-15164, CVE-2019-15163, CVE-2019-15162, CVE-2019-15161)
27 |   - lib/libssh2.so.1.0.1: Outdated libssh2 version 1.0.1 with critical vulnerabilities (CVE-2023-48795, CVE-2019-3857, CVE-2019-3855)
28 |   - lib/libwebsockets.so.10: Outdated libwebsockets library with potential use of insecure SSL protocols (SSLv23_server_method)
29 |   - lib/libjson-c.so.2.0.1: Outdated libjson-c version with critical CVEs (CVE-2020-12762, CVE-2013-6371, CVE-2013-6370)
30 |   - lib/libevent-2.1.so.6.0.2: Outdated libevent version 2.1.6.0.2 with critical vulnerabilities
31 |   - lib/libusb-0.1.so.4.4.4: Outdated libusb version 0.1.4 with critical vulnerabilities
32 |   - lib/ebtables/libebt_ip.so: High-risk function fcn.00000c9c uses unsafe string and integer handling functions (strdup, strchr, strtol) without proper input validation or boundary checks
33 |   - lib/ebtables/libebt_nat.so: Critical vulnerabilities in functions fcn.00000ac8 (use of 'gets'), fcn.00000de8 (lack of initialization/validation), and fcn.000006a4 (loop without boundary checks)
34 |   - lib/firewall/uci_firewall.sh: Insecure default firewall policy configuration (DEF_INPUT=DROP, DEF_OUTPUT=DROP, DEF_FORWARD=DROP)
35 |   - lib/ddns/dynamic_dns_functions.sh: Use of insecure HTTP protocol for IP address retrieval from 'http://checkip.dyndns.org'
36 |   - lib/ddns/dynamic_dns_updater.sh: Insecure handling of credentials in URL construction
37 |   - lib/tinysnmp/interfaces.so: High-risk vulnerabilities in `sym.getdevstats_stub` (dynamic call via `jalr t9` allowing arbitrary code execution)
38 |   - lib/tinysnmp/ubnt.so: Multiple high-risk functions identified, including potential buffer overflow vulnerabilities, insecure dynamic function calls, and insufficient input validation
39 |   - lib/tinysnmp/ieee802dot11.so: Critical vulnerabilities in functions `fcn.00000a9c`, `fcn.000018b4`, and `fcn.00000868` due to improper use of unsafe functions
40 |   - lib/tinysnmp/resources.so: High-risk functions identified: 1) `fcn.000007e8` contains multiple external calls without input/output validation
41 |   - lib/ubnt/cl_functions.sh: Insecure file handling and lock mechanism issues, including potential race conditions and symlink attacks in `cl_lock` function
42 |   - lib/wifi/hostapd.sh: Insecure cryptographic configuration supporting outdated protocols (WPA1, TKIP)
43 |   - lib/wifi/wpa_supplicant.sh: Sensitive credentials (private_key_passwd and password) written to /var/run/wpa_supplicant-$ifname.conf in plaintext
44 |   - lib/pppd/2.4.4/rp-pppoe.so: Critical vulnerabilities including potential buffer overflow in `fcn.000018c0` due to unsafe `sprintf`
45 |   - /usr/www/sshd-authkeys.cgi: Insecure SSH key management with token-based access control vulnerable to compromise or bypass
46 |   - /usr/www/getboardinfo.sh: Potential sensitive file exposure through output of '/etc/board.info' content
47 |   - /usr/etc/lighttpd/clighttpd.conf: Insecure configuration exposing internal paths and file structures, potential unauthorized access through 'airos.deny' and 'airos.allow' directives
48 |   - /usr/etc/lighttpd/lighttpd.conf: Insecure CGI handling and file access control, allowing execution of multiple CGI scripts without proper security context and permitting access to sensitive files like 'airview_manager.jnlp' and 'airview.jnlp'
49 |   - /usr/etc/ppp/ip-up: Insecure file handling and command execution risks, reads from '/tmp/running.cfg' and '/tmp/system.cfg' without validation, executes services from '/etc/udhcpc_services' without proper validation, risking arbitrary command execution
50 |   - /usr/etc/ppp/ip-down: Insecure file handling and command execution risks, reads from '/tmp/running.cfg' and '/tmp/system.cfg' without validation, executes external scripts (`/etc/ppp/rssi_decode.sh`) without explicit validation, risking arbitrary command execution
51 |   - /usr/etc/rc.d/rc.sysinit: Kernel panic settings ('echo "3" > /proc/sys/kernel/panic' and 'echo "1" > /proc/sys/vm/panic_on_oom') may cause system instability and denial of service
52 |   - /usr/etc/rc.d/rc: Insecure watchdog control functions (watchdog_stop and watchdog_start) that could be exploited to cause system instability or denial of service
53 |   - /usr/etc/rc.d/rc.modules: Insecure command execution through file paths in 'load_modules' and 'unload_modules' functions, processing files from '/etc/modules.d/*' and '/etc/modules.blacklist' without validation, risking command injection
54 |   - /usr/etc/rc.d/rc.softrestart: Use of temporary files with predictable names (e.g., /tmp/.system.cfg.$$, /tmp/.running.cfg.$$) risking race condition attacks, and execution of external binaries (/sbin/uav, /sbin/ubntconf) without validation, risking arbitrary code execution
55 |   - /usr/etc/rc.d/rc.stop: Insecure file handling and cleanup operations, removing files and directories (e.g., `/var/log/*`, `/tmp/.sessions.tdb`) without proper validation or sanitization, risking unintended file deletions or security issues
56 |   - /usr/etc/udhcpc/udhcpc: Insecure command execution via `eval` in `restore_ip_aliases` function, exposing sensitive network configuration details in `/etc/udhcpc/info.$interface`
57 | 
58 | - Major Issues: 
59 |   - /usr/www/*.js.gz: Multiple compressed JavaScript files found in web directory, potential for hidden vulnerabilities
60 |   - bin/dhcp-fwd: Version information exposure through '-v' and '--version' options
61 |   - bin/iperf: Version information exposure (iperf version 2.0.4) and CVE-2023-7250 (Denial of Service vulnerability)
62 |   - /usr/www/ubnt.net.js: Hardcoded IP addresses and network configurations found in the code, including fallback IPs (192.168.1.20, 192.168.10.1) and netmasks (255.255.255.0)
63 |   - /usr/etc/ppp: Potential network configuration vulnerabilities in PPP settings
64 |   - /usr/etc/rc.d: Potential system service vulnerabilities in startup scripts
65 |   - /usr/etc/rc.d/rc.sysinit: Hardcoded hostname ('echo UBNT > /proc/sys/kernel/hostname') could reveal system manufacturer/model, and responding to broadcast pings ('echo "0" > /proc/sys/net/ipv4/icmp_echo_ignore_broadcasts') exposes system to network discovery attacks
66 |   - /usr/etc/ppp: Potential IPv6 configuration vulnerabilities in PPP scripts
67 |   - /usr/etc/usb_modeswitch.d: Potential USB mode switching vulnerabilities in configuration files
68 |   - /usr/etc/udhcpc: Potential DHCP client vulnerabilities in configuration
69 | 
70 | - Other Issues: 
71 |   - Kernel version 2.6.32.71 is outdated and may contain unpatched vulnerabilities
72 | '''
73 | 


--------------------------------------------------------------------------------
/firmanalyzer/LogManage.py:
--------------------------------------------------------------------------------
 1 | import logging
 2 | import os
 3 | from typing import Optional, Dict
 4 | from pathlib import Path
 5 | 
 6 | class LogManager:
 7 |     """Centralized logging management for the firmware analyzer"""
 8 |     
 9 |     _instances: Dict[str, logging.Logger] = {}
10 |     _initialized: bool = False
11 |     
12 |     @classmethod
13 |     def setup(cls, base_log_path: str, console_level: int = logging.INFO, file_level: int = logging.DEBUG):
14 |         """Initialize logging configuration"""
15 |         if cls._initialized:
16 |             return
17 |             
18 |         # Create log directory if it doesn't exist
19 |         os.makedirs(base_log_path, exist_ok=True)
20 |         
21 |         # Configure root logger
22 |         root_logger = logging.getLogger()
23 |         root_logger.setLevel(logging.DEBUG)
24 |         
25 |         # Clear any existing handlers
26 |         root_logger.handlers.clear()
27 |         
28 |         # Create formatters
29 |         console_formatter = logging.Formatter('%(levelname)s %(name)s: %(message)s')
30 |         file_formatter = logging.Formatter('%(asctime)s - %(name)s - %(levelname)s - %(message)s')
31 |         
32 |         # Console handler
33 |         console_handler = logging.StreamHandler()
34 |         console_handler.setLevel(console_level)
35 |         console_handler.setFormatter(console_formatter)
36 |         root_logger.addHandler(console_handler)
37 |         
38 |         # File handler for main log
39 |         main_log_path = os.path.join(base_log_path, 'analyzer.log')
40 |         file_handler = logging.FileHandler(main_log_path)
41 |         file_handler.setLevel(file_level)
42 |         file_handler.setFormatter(file_formatter)
43 |         root_logger.addHandler(file_handler)
44 |         
45 |         cls._initialized = True
46 |     
47 |     @classmethod
48 |     def get_logger(cls, name: str, log_file: Optional[str] = None) -> logging.Logger:
49 |         """Get a logger with optional separate log file
50 |         
51 |         Args:
52 |             name: Logger name (usually module name)
53 |             log_file: Optional separate log file path for this logger
54 |             
55 |         Returns:
56 |             logging.Logger: Configured logger instance
57 |         """
58 |         if name in cls._instances:
59 |             return cls._instances[name]
60 |             
61 |         logger = logging.getLogger(name)
62 |         
63 |         # Add separate file handler if specified
64 |         if log_file:
65 |             file_handler = logging.FileHandler(log_file)
66 |             file_handler.setFormatter(
67 |                 logging.Formatter('%(asctime)s - %(levelname)s - %(message)s')
68 |             )
69 |             file_handler.setLevel(logging.DEBUG)
70 |             logger.addHandler(file_handler)
71 |         
72 |         cls._instances[name] = logger
73 |         return logger
74 | 


--------------------------------------------------------------------------------
/firmanalyzer/README.md:
--------------------------------------------------------------------------------
 1 | # FirmAnalyzer - Intelligent Firmware Analysis System
 2 | 
 3 | ## System Architecture
 4 | 
 5 | ```mermaid
 6 | sequenceDiagram
 7 |     participant User
 8 |     participant Runner
 9 |     participant Explorer
10 |     participant Analyzer
11 |     participant Tools
12 |     participant LLMAssistant
13 |     
14 |     User->>Runner: Input firmware & custom prompts
15 |     Note over Runner: Load prompts from YAML
16 |     Runner->>Runner: Extract & locate root
17 |     Runner->>Explorer: Start exploration
18 |     
19 |     loop Directory Analysis
20 |         Explorer->>Explorer: Scan directory content
21 |         Explorer->>Analyzer: Assign analysis tasks
22 |         
23 |         par Parallel Analysis
24 |             Analyzer->>Tools: Binary analysis
25 |             Tools-->>Analyzer: Raw findings
26 |             
27 |             Analyzer->>LLMAssistant: Risk assessment
28 |             LLMAssistant-->>Analyzer: Security evaluation
29 |             
30 |             Analyzer->>Tools: Configuration check
31 |             Tools-->>Analyzer: Config issues
32 |         end
33 |         
34 |         Analyzer-->>Explorer: Analysis results
35 |         Explorer->>Explorer: Summarize findings
36 |         Note over Explorer: Make next decision
37 |         Explorer->>Explorer: Select next target
38 |     end
39 |     
40 |     Explorer-->>User: Security report
41 | ```
42 | 
43 | ## Core Components
44 | 
45 | ### Main Components
46 | - **run.py** - System entry point and orchestration
47 | - **explore.py** - Firmware filesystem exploration engine
48 | - **analyze.py** - File analysis and security assessment core
49 | 
50 | ### Configuration
51 | - **requirements.yaml**
52 |   - File type definitions and analysis rules
53 |   - Priority directory configurations
54 |   - Security severity criteria
55 |   - Analysis workflow specifications
56 | 
57 | ## Requirements
58 | - Python 3.8+
59 | - radare2 5.9.9
60 | - binwalk v3.10 (rust-binwalk)
61 | 
62 | 
63 | 
64 | 


--------------------------------------------------------------------------------
/firmanalyzer/callback.py:
--------------------------------------------------------------------------------
 1 | import json
 2 | import logging
 3 | from typing import Dict, Any, List
 4 | from langchain_core.callbacks import BaseCallbackHandler
 5 | 
 6 | class TokenUsageCallbackHandler(BaseCallbackHandler):
 7 |     def __init__(self, save_path):
 8 |         super().__init__()
 9 |         self.total_prompt_tokens = 0
10 |         self.total_completion_tokens = 0
11 |         self.total_cost = 0
12 |         self.save_path = save_path
13 |         
14 |     def on_llm_start(self, serialized: Dict[str, Any], prompts: List[str], **kwargs: Any) -> None:
15 |         """Called when LLM invocation starts"""
16 |         logging.info("[Prompt]")
17 |         for i, prompt in enumerate(prompts, 1):
18 |             logging.info(f"\n{'-' * 50}\n{prompt}\n{'-' * 50}")
19 |         
20 |     def on_llm_end(self, response: Any, **kwargs: Any) -> None:
21 |         """Called when LLM invocation ends"""
22 |         try:
23 |             # Log the raw LLM response
24 |             if hasattr(response, 'generations'):
25 |                 for gen in response.generations:
26 |                     if gen:
27 |                         logging.info(f"\n{'-' * 50}\n{gen[0].text}\n{'-' * 50}")
28 | 
29 |             if hasattr(response, 'llm_output') and response.llm_output:
30 |                 token_usage = response.llm_output.get('token_usage', {})
31 |                 
32 |                 prompt_tokens = token_usage.get('prompt_tokens', 0)
33 |                 completion_tokens = token_usage.get('completion_tokens', 0)
34 |                 
35 |                 input_cost = prompt_tokens * (2.50 / 1_000_000)
36 |                 output_cost = completion_tokens * (10.00 / 1_000_000)
37 |                 
38 |                 self.total_prompt_tokens += prompt_tokens
39 |                 self.total_completion_tokens += completion_tokens
40 |                 self.total_cost += input_cost + output_cost
41 |                 
42 |                 print(f"\n📊 [Token Usage for this call]")
43 |                 print(f"Input tokens: {prompt_tokens:,} (${input_cost:.4f})")
44 |                 print(f"Output tokens: {completion_tokens:,} (${output_cost:.4f})")
45 |                 print(f"Total tokens: {prompt_tokens + completion_tokens:,}")
46 |                 print(f"Running total cost: ${self.total_cost:.4f}")
47 | 
48 |                 # Save token usage
49 |                 usage_data = {
50 |                     "input_cost": input_cost,
51 |                     "output_cost": output_cost,
52 |                     "total_cost": self.total_cost
53 |                 }
54 |                 
55 |                 with open(self.save_path, 'a', encoding='utf-8') as f:
56 |                     json.dump(usage_data, f, ensure_ascii=False)
57 |                     f.write("\n")
58 |                     
59 |         except Exception as e:
60 |             logging.error(f"Error in token usage calculation: {str(e)}")
61 |             if hasattr(response, 'llm_output'):
62 |                 logging.debug("LLM output: %s", response.llm_output)


--------------------------------------------------------------------------------
/firmanalyzer/client.py:
--------------------------------------------------------------------------------
 1 | import configparser
 2 | from openai import OpenAI
 3 | 
 4 | def get_api_key():
 5 |     config = configparser.ConfigParser()
 6 |     config.read('config.ini')
 7 |     try:
 8 |         return config['Settings']['Model'],config['Settings']['ModelApiKey'], config['Settings']['OrgId'], config['Settings']['ProjectId'],config['Settings']['BaseURL']
 9 |     except KeyError:
10 |         raise KeyError("Cannot find 'ModelApiKey' in 'Settings' section of config.ini")
11 | 
def create_openai_client():
    """Build an ``OpenAI`` client from the settings returned by ``get_api_key``.

    Returns:
        ``(model, client)`` - the configured model name and the client object.

    Any exception raised while constructing the client is printed and re-raised.
    """
    model, api_key, org_id, project_id, base_url = get_api_key()
    # org_id and project_id are read from the config but are currently not
    # forwarded to the client.
    client_options = {
        "api_key": api_key,
        "base_url": base_url,
        "timeout": 60,
    }
    try:
        return model, OpenAI(**client_options)
    except Exception as e:
        print(f"[OpenAI] Failed to create client: {str(e)}")
        raise


--------------------------------------------------------------------------------
/firmanalyzer/llm_config.py:
--------------------------------------------------------------------------------
  1 | import logging
  2 | import configparser
  3 | from langchain_openai import ChatOpenAI
  4 | from typing import Optional, Tuple, List
  5 | from langchain_core.runnables import RunnableLambda
  6 | 
  7 | class LLMClient:
  8 |     _instance = None
  9 |     _llm = None
 10 |     _callbacks = None
 11 |     
 12 |     def __new__(cls, config_path: str = 'config.ini'):
 13 |         if cls._instance is None:
 14 |             cls._instance = super(LLMClient, cls).__new__(cls)
 15 |         return cls._instance
 16 | 
 17 |     def __init__(self, config_path: str = 'config.ini'):
 18 |         if not hasattr(self, 'initialized'):
 19 |             self.config_path = config_path
 20 |             self.model = None
 21 |             self.api_key = None 
 22 |             self.org_id = None
 23 |             self.project_id = None
 24 |             self.base_url = None
 25 |             self._callbacks = []
 26 |             self.initialized = True
 27 |     
 28 |     def add_callback(self, callback) -> None:
 29 |         if callback not in self._callbacks:
 30 |             self._callbacks.append(callback)
 31 |             if self._llm:
 32 |                 self._llm.callbacks = self._callbacks
 33 | 
 34 |     def set_callbacks(self, callbacks: List) -> None:
 35 |         self._callbacks = callbacks
 36 |         if self._llm:
 37 |             self._llm.callbacks = self._callbacks
 38 | 
 39 |     def get_config(self) -> Tuple[str, str, str, str, str]:
 40 |         if all([self.model, self.api_key, self.org_id, self.project_id, self.base_url]):
 41 |             return self.model, self.api_key, self.org_id, self.project_id, self.base_url
 42 |             
 43 |         config = configparser.ConfigParser()
 44 |         config.read(self.config_path)
 45 |         
 46 |         try:
 47 |             self.model = config['Settings']['Model']
 48 |             self.api_key = config['Settings']['ModelApiKey']
 49 |             self.org_id = config['Settings']['OrgId']
 50 |             self.project_id = config['Settings']['ProjectId'] 
 51 |             self.base_url = config['Settings']['BaseURL']
 52 |             
 53 |             return self.model, self.api_key, self.org_id, self.project_id, self.base_url
 54 |             
 55 |         except KeyError as e:
 56 |             logging.error(f"Missing required config: {str(e)}")
 57 |             raise KeyError(f"Missing required config in 'Settings' section of {self.config_path}: {str(e)}")
 58 |         except Exception as e:
 59 |             logging.error(f"Error reading config: {str(e)}")
 60 |             raise
 61 | 
 62 |     def get_llm(self, temperature: float = 0) -> ChatOpenAI:
 63 |         if not self._llm:
 64 |             model, api_key, org_id, project_id, base_url = self.get_config()
 65 |             if model == "deepseek-reasoner":
 66 |                 base_url = "https://api.deepseek.com/beta"
 67 |             self._llm = ChatOpenAI(
 68 |                 model=model,
 69 |                 api_key=api_key, 
 70 |                 # temperature=temperature,
 71 |                 # organization=org_id,
 72 |                 base_url=base_url,
 73 |                 callbacks=self._callbacks,
 74 |                 timeout=120
 75 |             )
 76 |             
 77 |         return self._llm 
 78 | 
 79 |     def stream(self, messages: List[dict], temperature: Optional[float] = 0) -> str:
 80 |         try:
 81 |             llm = self.get_llm(temperature=temperature)
 82 |             result = []
 83 |             for chunk in llm.stream(messages):
 84 |                 result.append(chunk.content)
 85 |             return "".join(result)
 86 |         except Exception as e:
 87 |             logging.error(f"Stream call failed: {str(e)}")
 88 |             raise
 89 | 
 90 |     def invoke(self, messages: List[dict], temperature: Optional[float] = 0) -> str:
 91 |         try:
 92 |             llm = self.get_llm(temperature=temperature)
 93 |             return llm.invoke(messages).content
 94 |         except Exception as e:
 95 |             logging.error(f"Invoke call failed: {str(e)}")
 96 |             raise 
 97 |             
 98 |     def as_runnable(self, temperature: Optional[float] = 0) -> RunnableLambda:
 99 |         def _invoke(content: str) -> str:
100 |             messages = [{"role": "user", "content": content}]
101 |             return self.stream(messages, temperature=temperature)
102 |         
103 |         return RunnableLambda(_invoke)
104 | 
105 |     def as_runnable_sync(self, temperature: Optional[float] = 0) -> RunnableLambda:
106 |         def _invoke(content: str) -> str:
107 |             messages = [{"role": "user", "content": content}]
108 |             return self.invoke(messages, temperature=temperature).content
109 |         
110 |         return RunnableLambda(_invoke)


--------------------------------------------------------------------------------
/firmanalyzer/requirements.yaml:
--------------------------------------------------------------------------------
  1 | file_requirements:
  2 |   user: |
  3 |     - Focus analysis on files that can be externally triggered, accept user input, or impact system behavior. Prioritize files that meet **any** of the following conditions:
  4 | 
  5 |     - Executable binaries (ELF or scripts):
  6 |       * Accept external input (parameters, environment variables, file content, network data)
  7 |       * Registered in system startup scripts (e.g. rcS, init.d, inittab)
  8 |       * Triggered by web forms, CGI, or JavaScript requests
  9 |       * Perform critical operations such as command execution, file manipulation, or network access
 10 |       * Contain dangerous function calls (e.g., system, strcpy, sprintf, popen)
 11 |       
 12 |     - Dynamic libraries or shared objects (.so):
 13 |       * Files are shared object type (.so), or versioned links (e.g. libssl.so.1.0.2)
 14 |       * Present in dependency chains of known components or executables
 15 | 
 16 |     - Network service components:
 17 |       * Contain socket, bind, listen functionality
 18 |       * Bind to external interfaces (eth0, br0, 0.0.0.0) or open ports
 19 |       * Examples include: telnetd, pppd, udhcpd, smac2_tftpd, UDPserver, miniigd
 20 |       * Evaluate whether these accept unauthenticated input or expose default services
 21 | 
 22 |     - Web-related files:
 23 |       * Web server binaries (boa, httpd, mini_httpd, etc.)
 24 |       * Executable CGI scripts or shell scripts, commonly located in /bin, /cgi-bin, /www
 25 |       * HTML or JavaScript files containing forms, user input fields, or dynamic requests
 26 |       * Web configuration files (e.g., boa.conf) that define CGI paths or script execution permissions
 27 | 
 28 |     - Startup and configuration files:
 29 |       * Startup scripts (e.g., /etc/init.d/*, rcS, inittab) that invoke services
 30 |       * Config files specifying interface bindings, open ports, authentication modes, or firmware upgrade routines
 31 |       * Dynamic execution hooks (e.g., auto-update scripts, scheduled tasks)
 32 | 
 33 |     - Sensitive data files (analyze **only if externally accessible**):
 34 |       * Files containing plaintext credentials, keys, API tokens, or certificates in /etc/* (e.g., passwd, shadow, smbpasswd, *.pem)
 35 |       * Prioritize if accessible through web, services, or user-controlled paths
 36 | 
 37 |     - Exclusion scope (deprioritized or skipped):
 38 |       * Core system utilities (e.g., cp, mv, echo, cat) are not analyzed unless explicitly triggered with user-controlled input
 39 |       * Static, unused resource files are considered low priority
 40 | 
 41 | 
 42 | directory_requirements:
 43 |   user: |
 44 |     **Key Analysis Targets**
 45 |     1. Executable Locations
 46 |       - bin/
 47 |       - sbin/
 48 |       - usr/bin/
 49 |       - usr/sbin/
 50 |       - cgi-bin/
 51 |       - Contains triggerable ELF, scripts, CGI
 52 |       - Check for dangerous function calls or system command execution
 53 | 
 54 |     2. Sensitive Files
 55 |       - etc/
 56 |       - Contains startup process, authentication info, network bindings
 57 |       - Check for external interface bindings, plaintext passwords, config weaknesses
 58 | 
 59 |       - lib/
 60 |       - Contains custom or third-party .so libraries that may have vulnerable logic
 61 | 
 62 |     3. Web Interfaces & Upgrade Logic
 63 |       - www/
 64 |       - web/
 65 |       - upgrade/
 66 |       - Check for config uploads, firmware upgrades, web backend execution scripts
 67 | 
 68 |     **Priority Levels**
 69 |     - Priority 1 (Critical)
 70 |       - Components or scripts that can be directly accessed or triggered from outside the device, or that listen on external interfaces
 71 |     - Priority 2 (High)
 72 |       - Config files, key files, library files affecting system behavior or authentication
 73 |     - Priority 3 (Medium)
 74 |       - Auxiliary scripts, display pages, logs, upload files etc.
 75 | 
 76 | file_findings_requirements:
 77 |   user: |
 78 |     **Analysis Workflow**
 79 |     0. Attack Surface Discovery
 80 |       - Check for user input paths (web forms, JS, network connections, file parameters)
 81 |       - Check if component is running (started by init script, listening ports, daemon)
 82 |       - Check for input → dangerous function paths (system, strcpy etc.)
 83 | 
 84 |     1. Information Discovery
 85 |       - Detect versions (of executables or shared libraries), passwords, keys, interfaces, tokens, and other sensitive info
 86 | 
 87 |     2. Security Review
 88 |       - Check if services/ports are exposed
 89 |       - Check if configs allow unauthorized access or use weak encryption
 90 |       - Check if startup items load high-risk components
 91 | 
 92 |     3. Code Analysis
 93 |       - Find command execution functions, memory operation functions, input reading functions
 94 |       - Check if unvalidated input is used for dangerous operations
 95 |       - Track data flow to see if user input can affect system calls
 96 | 
 97 |     4. Vulnerability Search (Including Version Analysis)
 98 |       - Match CVE vulnerabilities based on component versions (libraries or binaries)
 99 |       - **Must list all CVEs matching loaded component versions even if no clear attack path is found**
100 | 
101 |     severity_rating:
102 |       level_5_critical:
103 |         description: Input → No validation → Dangerous function → Executable
104 |         examples:
105 |           - Remote Code Execution (RCE)
106 |           - Command Injection
107 |           - Private Key or Root Credential Exposure
108 |           - Encryption Bypass
109 |           - Arbitrary File Read/Write
110 |           - Dynamic Library Hijacking
111 |           - Configuration or script directly launches vulnerable or unauthorized executable
112 | 
113 |       level_4_high:
114 |         description: Controllable input + Data leakage + Weak configuration
115 |         examples:
116 |           - Password/API Key Exposure
117 |           - Privilege Escalation
118 |           - Dangerous Function Controlled by Input
119 |           - Weak or Disabled Encryption
120 |           - Sensitive Data in Plaintext Transmission
121 |           - Web Vulns: SSRF, CSRF, IDOR
122 |           - File references or configures execution of another risky or misconfigured component
123 |           - Indirect execution chain identified from user input to a dangerous binary
124 | 
125 |       level_3_medium:
126 |         description: Vulnerability exists but exploit path unclear or uncontrollable
127 |         examples:
128 |           - Known Version information or Vulnerable Component Loaded
129 |           - Default Credentials or Weak Permissions
130 |           - Exposed Configs with Limited Risk
131 |           - Hardcoded Interface Info
132 |           - Flawed Auth Logic (with conditions)
133 |           - Config or script references other components but path not fully controllable or executable
134 |           - Component linking observed but no clear attack surface
135 | 
136 |       level_0_2_low:
137 |         description: No exploit path, info leakage or minor misconfig
138 |         examples:
139 |           - Debug Info, Test Interfaces, Sensitive Comments
140 |           - Unused Open Ports or Services
141 |           - Minor Config Errors (e.g. DNS Leak, Timezone)
142 |           - References to other components exist but not executed or not exposed
143 |           - Inactive or broken component configuration linkage
144 | 
145 | security_report_template:
146 |   user: |
147 |     - [Location] Relative path
148 |     - [Type] Component/Credential/Configuration/Other
149 |     - [Version Info] Version/release information and CVE number if applicable
150 |     - [Description] Detailed issue description
151 |     - [Details] Technical details/Sensitive information
152 |     - [Impact] Potential security impact
153 |     - [Risk Level] Critical/High/Medium/Low
154 | 
155 | summary_template:
156 |   user: |
157 |     Firmware Summary:
158 |     [Basic Info]
159 |     - Name/Version: [Firmware name and version]
160 |     - Device/Type/Arch: [Device model and architecture]
161 |     - Key Info: [Other important information, such as release date, kernel version, etc.]
162 | 
163 |     [Coverage] 
164 |     - Key Dirs: [Key directories analyzed]
165 |     - Key Files: [Key files analyzed]
166 | 
167 |     [Main Issues]
168 |     - Critical Issues: [Location]: Root cause of the issue (Specific technical details like vulnerable code/misconfiguration/insecure functions etc.)
169 |     - Major Issues: [Location]: Root cause of the issue (Specific technical details like vulnerable code/misconfiguration/insecure functions etc.)
170 |     - Other Issues: [Location]: Root cause of the issue (Specific technical details like vulnerable code/misconfiguration/insecure functions etc.)
171 | 
172 |     [Attack Surface]
173 |       Describe the attack chain or specify the exact exploitation method.
174 | 


--------------------------------------------------------------------------------
/firmanalyzer/run.py:
--------------------------------------------------------------------------------
  1 | import os
  2 | import yaml
  3 | import time
  4 | import glob
  5 | import logging
  6 | import subprocess
  7 | import argparse
  8 | import configparser
  9 | from pathlib import Path
 10 | from explore import explorer
 11 | from LogManage import LogManager
 12 | 
 13 | 
 14 | def load_binwalk_path():
 15 |     config = configparser.ConfigParser()
 16 |     config_path = os.path.join(os.path.dirname(__file__), 'config.ini')
 17 |     try:
 18 |         config.read(config_path)
 19 |         return config.get('Settings', 'binwalk_path', fallback='/usr/local/bin/binwalk')
 20 |     except Exception as e:
 21 |         logging.warning(f"Failed to load config file, using default binwalk path: {str(e)}")
 22 |         return '/usr/local/bin/binwalk'
 23 | 
 24 | 
 25 | def extract_firmware_with_binwalk(firmware_path: str, extract_root: str) -> str:
 26 |     firmware_name = os.path.splitext(os.path.basename(firmware_path))[0]
 27 |     firmware_extract_path = os.path.join(extract_root, firmware_name)
 28 | 
 29 |     if os.path.exists(firmware_extract_path):
 30 |         import shutil
 31 |         shutil.rmtree(firmware_extract_path)
 32 | 
 33 |     os.makedirs(firmware_extract_path, exist_ok=True)
 34 |     binwalk_path = load_binwalk_path()
 35 | 
 36 |     cmd = f"'{binwalk_path}' -Me '{firmware_path}' --directory '{firmware_extract_path}'"
 37 |     process = subprocess.Popen(cmd, shell=True, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
 38 |     stdout, stderr = process.communicate()
 39 | 
 40 |     if process.returncode != 0:
 41 |         raise Exception(f"Binwalk extraction failed: {stderr.decode()}")
 42 | 
 43 |     return stdout.decode('utf-8', errors='ignore')
 44 | 
 45 | 
 46 | def find_firmware_root(start_path, required_dirs=None, file_patterns=None, min_score=12):
 47 |     dir_weights = {
 48 |         'bin': 3, 'sbin': 2, 'lib': 3, 'etc': 2, 'usr': 1,
 49 |         'var': 1, 'www': 2, 'system': 2
 50 |     }
 51 |     file_weights = {
 52 |         'bin/sh': 5, 'etc/*.conf': 2, '*.ko': 3,
 53 |         'init': 4, 'bin/busybox': 5, 'usr/lib/*.so': 2
 54 |     }
 55 |     required_dirs = required_dirs or dir_weights
 56 |     file_patterns = file_patterns or file_weights
 57 |     best = {'path': None, 'score': 0, 'depth': 0}
 58 | 
 59 |     def is_standard_fs(root):
 60 |         must_have = ['bin', 'lib']
 61 |         optional = ['etc', 'usr', 'www', 'var']
 62 |         return all(os.path.isdir(os.path.join(root, d)) for d in must_have) and \
 63 |                any(os.path.isdir(os.path.join(root, d)) for d in optional)
 64 | 
 65 |     def is_root_like(root):
 66 |         return any(os.path.isdir(os.path.join(root, d)) for d in ['bin', 'sbin', 'etc'])
 67 | 
 68 |     for root, dirs, _ in os.walk(os.path.normpath(start_path), topdown=False):
 69 |         if is_root_like(root) and is_standard_fs(root):
 70 |             return os.path.normpath(root)
 71 | 
 72 |         dir_score = sum(weight for d, weight in required_dirs.items() if os.path.isdir(os.path.join(root, d)))
 73 |         file_score = sum(weight * len(glob.glob(os.path.join(root, pattern)))
 74 |                          for pattern, weight in file_patterns.items())
 75 |         depth = len(os.path.relpath(root, start_path).split(os.sep))
 76 |         depth_penalty = depth * 0.2
 77 |         total_score = dir_score + file_score - depth_penalty
 78 | 
 79 |         if any(x in root.split(os.sep) for x in {'modules', 'kernel', 'drivers'}):
 80 |             continue
 81 |         if any(term in root.lower() for term in {'extracted', 'unpacked', 'temp'}):
 82 |             total_score *= 0.3
 83 | 
 84 |         if total_score >= min_score and (total_score > best['score'] or 
 85 |            (total_score == best['score'] and depth > best['depth'])):
 86 |             best.update({'path': root, 'score': total_score, 'depth': depth})
 87 | 
 88 |     return best['path'] if best['score'] >= min_score else None
 89 | 
 90 | 
 91 | def analyze_firmware_content(firmware_dir: str, save_path: str, binwalk_report: str = ""):
 92 |     start_time = time.time()
 93 | 
 94 |     if not os.path.isdir(firmware_dir):
 95 |         raise ValueError(f"Invalid firmware directory: {firmware_dir}")
 96 |     os.makedirs(save_path, exist_ok=True)
 97 | 
 98 |     logger = LogManager.get_logger('FirmwareContentAnalyzer', os.path.join(save_path, "explore.log"))
 99 |     logger.info(f"Analyzing firmware in: {firmware_dir}")
100 |     logger.info(f"Saving results to: {save_path}")
101 | 
102 |     with open(os.path.join(os.path.dirname(__file__), 'requirements.yaml'), encoding='utf-8') as f:
103 |         prompts = yaml.safe_load(f)
104 | 
105 |     state = {
106 |         "input": {
107 |             "file_requirements": prompts['file_requirements']['user'],
108 |             "file_findings_requirements": prompts['file_findings_requirements']['user'],
109 |             "directory_requirements": prompts['directory_requirements']['user'],
110 |             "security_report_template": prompts['security_report_template']['user'],
111 |             "summary_template": prompts['summary_template']['user'],
112 |         },
113 |         "current_dir": firmware_dir,
114 |         "base_path": str(Path(firmware_dir)),
115 |         "dir_data": {"files": [], "index": 0, "dir_path": ""},
116 |         "dir_stack": [],
117 |         "response": {"thought": {"file": "", "reason": ""}, "action": "next"},
118 |         "scratchpad": [],
119 |         "observation": "",
120 |         "security_report_summary": binwalk_report[:10000],
121 |         "save_path": save_path
122 |     }
123 | 
124 |     report = explorer(state, max_steps=360)
125 |     logging.info(f"Total analysis time: {time.time() - start_time:.2f} seconds")
126 |     return report
127 | 
128 | 
def process_firmware(input_path: str, output_path: str):
    """Analyze a firmware image file or an already extracted directory.

    Work directories ``<output_path>/<input name>/log`` and ``.../extracted``
    are created and logging is set up before the input is examined. A file is
    first unpacked with binwalk; a directory is searched for a filesystem root
    as is.

    Returns:
        The report produced by ``analyze_firmware_content``.

    Raises:
        ValueError: if ``input_path`` is neither a directory nor a file, or if
            no filesystem root can be located.
    """
    logger = LogManager.get_logger('FirmwareProcessor')

    stem, _extension = os.path.splitext(os.path.basename(input_path))
    base_dir = os.path.join(output_path, stem)
    analysis_dir = os.path.join(base_dir, "log")
    extraction_dir = os.path.join(base_dir, "extracted")
    for work_dir in (analysis_dir, extraction_dir):
        os.makedirs(work_dir, exist_ok=True)
    LogManager.setup(analysis_dir)

    binwalk_report = ""
    if os.path.isdir(input_path):
        logger.info(f"Analyzing extracted firmware directory: {input_path}")
        fs_root = find_firmware_root(input_path)
    elif os.path.isfile(input_path):
        logger.info(f"Extracting firmware: {input_path} -> {extraction_dir}")
        binwalk_report = extract_firmware_with_binwalk(input_path, extraction_dir)
        fs_root = find_firmware_root(extraction_dir)
    else:
        raise ValueError(f"Invalid firmware file: {input_path}")

    if not fs_root:
        raise ValueError("Could not locate valid filesystem root directory")

    logger.info(f"Found filesystem root at: {fs_root}")
    return analyze_firmware_content(fs_root, analysis_dir, binwalk_report)
156 | 
157 | 
def main(firmware_path, save_path):
    """Process one firmware input and return the resulting report.

    Prints a completion message on success. On any exception an error line is
    printed and the exception is re-raised.
    """
    try:
        outcome = process_firmware(firmware_path, save_path)
        print(f"\nAnalysis complete. Results saved to: {save_path}")
    except Exception as e:
        print(f"Error during firmware analysis: {str(e)}")
        raise
    else:
        return outcome
166 | 
167 | 
if __name__ == "__main__":
    # Command-line entry point: two positional arguments, forwarded to main().
    cli = argparse.ArgumentParser(description='Firmware Analysis Tool')
    for arg_name, arg_help in (
        ('firmware_path', 'Path to firmware file or extracted firmware directory'),
        ('save_path', 'Path to save analysis results'),
    ):
        cli.add_argument(arg_name, help=arg_help)
    options = cli.parse_args()
    main(options.firmware_path, options.save_path)
174 |     


--------------------------------------------------------------------------------
/firmanalyzer/tools.py:
--------------------------------------------------------------------------------
  1 | import re
  2 | import subprocess
  3 | import logging
  4 | import os
  5 | import shutil
  6 | from typing import Dict, List
  7 | from collections import defaultdict
  8 | from math import log2
  9 | 
# Configure the root logger at import time: INFO level, timestamped messages,
# written through a single StreamHandler.
logging.basicConfig(
    level=logging.INFO,
    format='%(asctime)s [%(levelname)s] %(message)s',
    handlers=[logging.StreamHandler()]
)

# Timeout (seconds) passed to the external `strings` / `objdump` calls in BinaryAnalyzer.
PROCESS_TIMEOUT = 30
# Largest file BinaryAnalyzer._validate_file accepts.
MAX_FILE_SIZE = 100 * 1024 * 1024  # 100MB

# Regexes applied line by line to `strings` output to find version-like tokens.
# Each entry is compiled on its own, so inline flags such as (?i) affect only
# that entry; entries without (?i) match lower-case letters only.
VERSION_PATTERNS = [
    # Semver-like: optional "v"/"version" prefix, 2-4 dot-separated components,
    # optional "-prerelease" and "+build" suffixes (three adjacent literals = one pattern).
    r'(?i)\b(?:v|version)?(?:0|[1-9]\d*[a-z]*)(?:\.(?:0|[1-9]\d*[a-z]*)){1,3}'
    r'(?:-(?:0|[1-9]\d*|\d*[a-z-][0-9a-z-]*)(?:\.(?:0|[1-9]\d*|\d*[a-z-][0-9a-z-]*))*)?'
    r'(?:\+[0-9a-z-]+(?:\.[0-9a-z-]+)*)?\b',
    
    # Date-like: 20YY, then one or two month tokens (01-12 or a three-letter
    # name) and an optional day 01-31; separators - _ . / are optional.
    r'\b(?:20\d{2}(?:[-_./]?(?:0[1-9]|1[0-2]|jan|feb|mar|apr|may|jun|jul|aug|sep|oct|nov|dec))'
    r'{1,2}(?:[-_./]?(?:0[1-9]|[12][0-9]|3[01]))?)\b',
    
    # Build / revision / release tag followed by a number.
    r'(?i)\b(?:build|bld|rev|r|rel|release)[-_]?(?:\d+[a-z]*|\d+\.\d+(?:\.\d+){0,2})\b',
    
    # Exactly four dot-separated integer groups (IPv4-shaped strings match too).
    r'\b(?:\d+\.){3}\d+\b',
    
    # lib/dll/so/module prefix, optional name part, then a dotted version.
    r'(?i)\b(?:lib|dll|so|module)[-_]?(?:[a-z0-9]+[-_])?v?\d+(?:\.\d+){1,3}[a-z0-9-]*\b',
    
    # Two to four groups of 4-8 hex digits joined by - _ or . with optional 0x prefix.
    r'\b(?:0x)?[0-9a-f]{4,8}(?:[-_.][0-9a-f]{4,8}){1,3}\b',
    
    # Letters (optionally ending in "-") followed by 20YY(+letter) or digits plus 2+ letters.
    r'\b(?:[a-z]+-?)(?:20\d{2}[a-z]?|\d+[a-z]{2,})\b',
    
    # "<name>/<version>" or "<name>-<version>" tokens.
    r'(?i)\b[a-z0-9_-]+[/-]v?\d+\.\d+(?:\.\d+)*[a-z0-9.-]*\b',
    
    # Dotted version followed by a letter suffix and optional digits.
    r'(?i)\bv?\d+\.\d+(?:\.\d+)*[-_]?[a-z]+\d*\b',
    
    # Three-component version immediately followed by letters.
    r'\b\d+\.\d+\.\d+[a-z]+\b'
]

# Category name -> regex, applied line by line to `strings` output by
# BinaryAnalyzer.analyze_sensitive_info. The 'base64_data' category is
# additionally checked there with BinaryAnalyzer._validate_base64.
SENSITIVE_PATTERNS = {
    # key[:=]value assignments; the password value must be at least 8 characters.
    'password': r'(?i)\b(?:password|passwd|pwd)\s*[:=]\s*["\']?([^\s"\']{8,})["\']?',
    'api_key': r'(?i)\b(?:api[_-]?key|secret[_-]?key)\s*[:=]\s*["\']?([a-f0-9]{16,}|[A-Za-z0-9+/]{32,})["\']?',
    'token': r'(?i)\b(?:access[_-]?token|auth[_-]?token|bearer)\s*[:=]\s*["\']?([a-f0-9]{32,}|eyJ[\w-]*\.[\w-]*\.[\w-]*)["\']?',
    # http/https/ftp URLs, optionally with embedded user[:password]@.
    'url': r'(?i)\b(?:https?|ftp)://(?:[^\s:@/]+(?::[^\s@/]*)?@)?(?:[a-z0-9-]+\.)+[a-z]{2,}\b(?:/[^\s"\']*)?',
    # Dotted-quad IPv4 address with optional :port.
    'ip': r'\b(?:(?:25[0-5]|2[0-4][0-9]|[01]?[0-9][0-9]?)\.){3}(?:25[0-5]|2[0-4][0-9]|[01]?[0-9][0-9]?)(?::\d{1,5})?\b',
    # No (?i): the domain part matches lower-case letters only.
    'email': r'\b[\w.%+-]+@[a-z0-9.-]+\.[a-z]{2,}\b',
    # A small fixed list of account names paired with well-known default passwords.
    'firmware_creds': r'(?i)\b(?:admin|root|user)\s*[=:]\s*["\']?(?:admin|root|password|12345|zte521)["\']?',
    # PEM private-key header line.
    'private_key': r'-----BEGIN (?:RSA|DSA|EC|OPENSSH) PRIVATE KEY-----',
    'encrypted_data': r'\b(?:AES|DES|3DES|BLOWFISH)[-_]?(?:KEY|IV)\s*[=:]\s*["\']?[0-9a-fA-F]{16,}["\']?',
    'debug_interface': r'(?i)\b(?:uart|jtag|console)\s*[=:]\s*\d+',
    'hidden_service': r'(?i)\b(?:backdoor|secret)_(?:port|service)\s*[=:]\s*\d+',
    'suspicious_path': r'/(?:etc|tmp|var)/(?:passwd|shadow|secret)[^\s"\']*',
    # At least 20 four-character base64 groups, with optional padded tail.
    'base64_data': r'(?:[A-Za-z0-9+/]{4}){20,}(?:[A-Za-z0-9+/]{2}==|[A-Za-z0-9+/]{3}=)?'
}
 59 | 
 60 | class BinaryAnalyzer:
 61 |     def __init__(self, file_path: str):
 62 |         self.file_path = self._validate_file(file_path)
 63 |         self.strings_cache = None
 64 |         self._common_false_positives = {
 65 |             'example.com', 'localhost', 'test.com', 
 66 |             'dummy', 'test', 'example', 'sample',
 67 |             'changeme', 'placeholder', 'TODO', 'FIXME'
 68 |         }
 69 | 
 70 |     @staticmethod
 71 |     def _validate_file(path: str) -> str:
 72 |         if not os.path.exists(path):
 73 |             raise ValueError(f"File does not exist: {path}")
 74 |         if os.path.islink(path):
 75 |             raise ValueError("Symbolic links are not supported")
 76 |         if not os.path.isfile(path):
 77 |             raise ValueError("Regular file required")
 78 |         if os.path.getsize(path) > MAX_FILE_SIZE:
 79 |             raise ValueError("File size exceeds limit")
 80 |         return os.path.abspath(path)
 81 | 
 82 |     def _get_strings_output(self) -> str:
 83 |         if self.strings_cache is not None:
 84 |             return self.strings_cache
 85 | 
 86 |         try:
 87 |             result = subprocess.run(
 88 |                 ['strings', self.file_path],
 89 |                 stdout=subprocess.PIPE,
 90 |                 stderr=subprocess.PIPE,
 91 |                 timeout=PROCESS_TIMEOUT
 92 |             )
 93 |             if result.returncode != 0:
 94 |                 logging.warning(f"strings command failed: {result.stderr.decode()[:200]}")
 95 |                 return ""
 96 |             
 97 |             self.strings_cache = result.stdout.decode('utf-8', errors='ignore')
 98 |             return self.strings_cache
 99 |         except Exception as e:
100 |             logging.error(f"Failed to execute strings: {str(e)}")
101 |             return ""
102 | 
103 |     def _safe_grep(self, pattern: str, data: str) -> List[Dict[str, str]]:
104 |         try:
105 |             compiled = re.compile(pattern)
106 |             matches = []
107 |             for line in data.splitlines():
108 |                 match = compiled.search(line)
109 |                 if match:
110 |                     matches.append({
111 |                         'line': line,
112 |                         'match': match.group()
113 |                     })
114 |             return matches
115 |         except re.error as e:
116 |             logging.warning(f"Invalid regex pattern {pattern}: {str(e)}")
117 |             return []
118 | 
119 |     def _is_false_positive(self, s: str) -> bool:
120 |         s_lower = s.lower()
121 |         return any(fp in s_lower for fp in self._common_false_positives) or len(set(s)) < 4
122 | 
123 |     def extract_versions(self) -> List[Dict[str, str]]:
124 |         versions = []
125 |         strings_data = self._get_strings_output()
126 |         
127 |         for pattern in VERSION_PATTERNS:
128 |             matches = self._safe_grep(pattern, strings_data)
129 |             for ver in matches:
130 |                 if len(ver['match']) > 4 and not self._is_false_positive(ver['match']):
131 |                     versions.append(ver)
132 |         
133 |         # 按匹配长度排序，并去重
134 |         unique_versions = []
135 |         seen_matches = set()
136 |         for v in sorted(versions, key=lambda x: len(x['match']), reverse=True):
137 |             if v['match'] not in seen_matches:
138 |                 seen_matches.add(v['match'])
139 |                 unique_versions.append(v)
140 |         
141 |         return unique_versions[:20]  # 限制返回数量
142 | 
143 |     def analyze_sensitive_info(self) -> Dict[str, List[Dict[str, str]]]:
144 |         results = defaultdict(list)
145 |         strings_data = self._get_strings_output()
146 |         
147 |         for info_type, pattern in SENSITIVE_PATTERNS.items():
148 |             matches = self._safe_grep(pattern, strings_data)
149 |             filtered = [m for m in matches if not self._is_false_positive(m['match'])]
150 |             
151 |             if info_type == 'base64_data':
152 |                 filtered = [m for m in filtered if self._validate_base64(m['match'])]
153 |             
154 |             results[info_type].extend(filtered[:20])
155 | 
156 |         return dict(results)
157 | 
158 |     def _validate_base64(self, s: str) -> bool:
159 |         import base64
160 |         try:
161 |             if len(s) % 4 != 0:
162 |                 return False
163 |             base64.b64decode(s)
164 |             return True
165 |         except:
166 |             return False
167 | 
168 |     def analyze_elf_info(self) -> Dict[str, List[str]]:
169 |         elf_info = defaultdict(list)
170 |         
171 |         if not shutil.which('objdump'):
172 |             logging.warning("objdump not available, skipping ELF analysis")
173 |             return dict(elf_info)
174 |         
175 |         try:
176 |             section_meta = subprocess.run(
177 |                 ['objdump', '-h', self.file_path],
178 |                 stdout=subprocess.PIPE,
179 |                 timeout=PROCESS_TIMEOUT
180 |             ).stdout.decode(errors='ignore')
181 |             
182 |             section_strategies = {
183 |                 '.rodata': {'min_length': 6, 'filters': [self._is_version_like, self._is_credential_like], 'max_items': 50},
184 |                 '.data': {'min_length': 8, 'filters': [self._is_config_like], 'max_items': 30},
185 |                 '.comment': {'min_length': 4, 'filters': [self._is_compiler_info], 'max_items': 20}
186 |             }
187 |             
188 |             for section, strategy in section_strategies.items():
189 |                 if f"{section} " in section_meta:
190 |                     content = subprocess.run(
191 |                         ['objdump', '-s', '-j', section, self.file_path],
192 |                         stdout=subprocess.PIPE,
193 |                         timeout=PROCESS_TIMEOUT
194 |                     ).stdout.decode(errors='ignore')
195 |                     
196 |                     candidates = self._extract_meaningful_strings(content, strategy['min_length'])
197 |                     filtered = [s.strip() for s in candidates if any(f(s.strip()) for f in strategy['filters'])]
198 |                     if filtered:
199 |                         elf_info[section] = list(dict.fromkeys(filtered))[:strategy['max_items']]
200 |                     
201 |             return dict(elf_info)
202 |         except Exception as e:
203 |             logging.error(f"ELF analysis failed: {str(e)}")
204 |             return dict(elf_info)
205 | 
206 |     def _extract_meaningful_strings(self, content: str, min_length: int = 8) -> List[str]:
207 |         base_strings = re.findall(fr'[\x20-\x7E]{{{min_length},}}', content)
208 |         entropy_filtered = [s for s in base_strings if self._calculate_entropy(s) > 2.5]
209 |         structure_patterns = [
210 |             r'^[A-Za-z0-9][A-Za-z0-9_.+-]*$',
211 |             r'^[A-Za-z]+(?:\s[A-Za-z]+)*$',
212 |             r'^v?\d+\.\d+',
213 |         ]
214 |         return [s for s in entropy_filtered if any(re.match(p, s) for p in structure_patterns)]
215 | 
216 |     def _calculate_entropy(self, s: str) -> float:
217 |         freq = defaultdict(int)
218 |         for c in s:
219 |             freq[c] += 1
220 |         entropy, total = 0.0, len(s)
221 |         for count in freq.values():
222 |             p = count / total
223 |             entropy -= p * log2(p)
224 |         return entropy
225 | 
226 |     def _is_version_like(self, s: str) -> bool:
227 |         return any(re.search(p, s) for p in VERSION_PATTERNS)
228 | 
229 |     def _is_credential_like(self, s: str) -> bool:
230 |         return any(re.search(p, s) for p in SENSITIVE_PATTERNS.values())
231 | 
232 |     def _is_config_like(self, s: str) -> bool:
233 |         config_patterns = [
234 |             r'^[A-Za-z_][A-Za-z0-9_]*=',
235 |             r'^\w+://',
236 |             r'^\d{1,3}\.\d{1,3}\.\d{1,3}\.\d{1,3}(?::\d+)?$'
237 |         ]
238 |         return any(re.match(p, s) for p in config_patterns)
239 | 
240 |     def _is_compiler_info(self, s: str) -> bool:
241 |         compiler_keywords = {'GCC', 'clang', 'MSVC', 'build', 'optimize', 'version', 'target', 'configure'}
242 |         return any(kw in s for kw in compiler_keywords)
243 | 
244 |     def full_analysis(self) -> Dict:
245 |         return {
246 |             'file_info': {
247 |                 'path': self.file_path,
248 |                 'size': os.path.getsize(self.file_path),
249 |                 'sha256': self._calculate_hash(),
250 |             },
251 |             'versions': self.extract_versions(),
252 |             'sensitive_info': self.analyze_sensitive_info(),
253 |             'elf_sections': self.analyze_elf_info()
254 |         }
255 | 
256 |     def _calculate_hash(self) -> str:
257 |         try:
258 |             result = subprocess.run(
259 |                 ['sha256sum', self.file_path],
260 |                 stdout=subprocess.PIPE,
261 |                 timeout=PROCESS_TIMEOUT
262 |             )
263 |             return result.stdout.decode().split()[0]
264 |         except Exception as e:
265 |             logging.warning(f"Hash calculation failed: {str(e)}")
266 |             return ""
267 | 
268 | 


--------------------------------------------------------------------------------
/firmcrawler/Examples/dlink/navigation_links.jsonl:
--------------------------------------------------------------------------------
 1 | {"text": "COVR AC2200 Wi-Fi System 2-pack", "url": "https://support.dlink.com/ProductInfo.aspx?m=COVR-2202-US", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
 2 | {"text": "COVR-3902-US", "url": "https://support.dlink.com/ProductInfo.aspx?m=COVR-3902-US", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
 3 | {"text": "AC3900 Whole Home Wi-Fi System", "url": "https://support.dlink.com/ProductInfo.aspx?m=COVR-3902-US", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
 4 | {"text": "COVR-3902-US", "url": "https://support.dlink.com/ProductInfo.aspx?m=COVR-3902-US", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
 5 | {"text": "AC3900 Whole Home Wi-Fi System", "url": "https://support.dlink.com/ProductInfo.aspx?m=COVR-3902-US", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
 6 | {"text": "DES-1008E", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-1330", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
 7 | {"text": "8-Port 10/100 Unmanaged Desktop Switch", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-1330", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
 8 | {"text": "DES-105", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-1330", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
 9 | {"text": "5 Port 10/100 Desktop Switch", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-1330", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
10 | {"text": "DFE-538TX", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-1530-US", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
11 | {"text": "COVR-C1203-US", "url": "https://support.dlink.com/ProductInfo.aspx?m=COVR-C1203-US", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
12 | {"text": "Dual Band Whole Home Wi-Fi System", "url": "https://support.dlink.com/ProductInfo.aspx?m=COVR-C1203-US", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
13 | {"text": "COVR-C1203-US", "url": "https://support.dlink.com/ProductInfo.aspx?m=COVR-C1203-US", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
14 | {"text": "Dual Band Whole Home Wi-Fi System", "url": "https://support.dlink.com/ProductInfo.aspx?m=COVR-C1203-US", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
15 | {"text": "COVR-C1213", "url": "https://support.dlink.com/ProductInfo.aspx?m=COVR-C1213", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
16 | {"text": "Dual Band Whole Home Wi-Fi System", "url": "https://support.dlink.com/ProductInfo.aspx?m=COVR-C1213", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
17 | {"text": "COVR-L1900", "url": "https://support.dlink.com/ProductInfo.aspx?m=COVR-L1900", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
18 | {"text": "AC1900 Whole Home Mesh Wi-Fi Router/Extender", "url": "https://support.dlink.com/ProductInfo.aspx?m=COVR-L1900", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
19 | {"text": "COVR-P2502-US", "url": "https://support.dlink.com/ProductInfo.aspx?m=COVR-P2502-US", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
20 | {"text": "Hybrid Powerline Whole Home Mesh Wi-Fi System", "url": "https://support.dlink.com/ProductInfo.aspx?m=COVR-P2502-US", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
21 | {"text": "COVR-R2203", "url": "https://support.dlink.com/ProductInfo.aspx?m=COVR-R2203", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
22 | {"text": "Tri Band Whole Home Mesh Wi-Fi System", "url": "https://support.dlink.com/ProductInfo.aspx?m=COVR-R2203", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
23 | {"text": "COVR-X1862-CA/COVR-X1863-CA", "url": "https://support.dlink.com/ProductInfo.aspx?m=COVR-X1862-CA%2FCOVR-X1863-CA", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
24 | {"text": "COVR-X1862-CA/COVR-X1863-CA", "url": "https://support.dlink.com/ProductInfo.aspx?m=COVR-X1862-CA%2FCOVR-X1863-CA", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
25 | {"text": "AX1800 Mesh Wi-Fi 6 System (2PK & 3PK)", "url": "https://support.dlink.com/ProductInfo.aspx?m=COVR-X1862-CA%2FCOVR-X1863-CA", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
26 | {"text": "DAP-1325", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-1325", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
27 | {"text": "N300 Wi-Fi Range Extender", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-1325", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
28 | {"text": "DAP-1325-US", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-1325-US", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
29 | {"text": "Wi-Fi N300 Range Extender", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-1325-US", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
30 | {"text": "DAP-1610-US", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-1610-US", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
31 | {"text": "AC1200 Wi-Fi Range Extender", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-1610-US", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
32 | {"text": "DAP-1620", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-1620", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
33 | {"text": "AC1200 Wi-Fi Range Extender", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-1620", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
34 | {"text": "DAP-1620-EXO", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-1620-EXO", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
35 | {"text": "AC1200 Wi‑Fi Exo Range Extender", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-1620-EXO", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
36 | {"text": "DAP-1650", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-1650", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
37 | {"text": "Wireless AC1200 Dual Band Gigabit Range Extender", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-1650", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
38 | {"text": "DAP-1650", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-1650", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
39 | {"text": "Wireless AC1200 Dual Band Gigabit Range Extender", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-1650", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
40 | {"text": "DAP-1720", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-1720", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
41 | {"text": "AC1750 Wi-Fi Range Extender", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-1720", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
42 | {"text": "DAP-1755-US", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-1755-US", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
43 | {"text": "AC1750 Mesh Wi-Fi Range Extender", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-1755-US", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
44 | {"text": "DAP-1820-US", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-1820-US", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
45 | {"text": "AC2000 Dual Band Wi-Fi Range Extender", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-1820-US", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
46 | {"text": "DAP-1950-CA", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-1950-CA", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
47 | {"text": "AC1900 High-Performance Mesh Wi-Fi Range Extender", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-1950-CA", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
48 | {"text": "DAP-1955-US", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-1955-US", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
49 | {"text": "AC1900 Mesh Wi-Fi Range Extender", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-1955-US", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
50 | {"text": "DAP-LX1880-CA", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-LX1880-CA", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
51 | {"text": "AX1800 Mesh Wi-Fi 6 Range Extender", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-LX1880-CA", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
52 | {"text": "DAP-X1870", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-X1870", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
53 | {"text": "AX1800 Mesh Wi-Fi 6 Range Extender", "url": "https://support.dlink.com/ProductInfo.aspx?m=DAP-X1870", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
54 | {"text": "DCH-S150", "url": "https://support.dlink.com/ProductInfo.aspx?m=DCH-S150", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
55 | {"text": "mydlink Wi-Fi Smart Motion Sensor", "url": "https://support.dlink.com/ProductInfo.aspx?m=DCH-S150", "source_page": "https://support.dlink.com/AllPro.aspx", "original_href": "javascript:void(0);"}
56 | 


--------------------------------------------------------------------------------
/firmcrawler/Examples/dlink/screenshot_1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhang-xr/FirmLLM/8dc567bdfa7fa514f1138725c1195261fc8aa041/firmcrawler/Examples/dlink/screenshot_1.png


--------------------------------------------------------------------------------
/firmcrawler/Examples/dlink/screenshot_2.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhang-xr/FirmLLM/8dc567bdfa7fa514f1138725c1195261fc8aa041/firmcrawler/Examples/dlink/screenshot_2.png


--------------------------------------------------------------------------------
/firmcrawler/Examples/dlink/screenshot_3.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhang-xr/FirmLLM/8dc567bdfa7fa514f1138725c1195261fc8aa041/firmcrawler/Examples/dlink/screenshot_3.png


--------------------------------------------------------------------------------
/firmcrawler/Examples/dlink/screenshot_4.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhang-xr/FirmLLM/8dc567bdfa7fa514f1138725c1195261fc8aa041/firmcrawler/Examples/dlink/screenshot_4.png


--------------------------------------------------------------------------------
/firmcrawler/Examples/dlink/screenshot_5.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhang-xr/FirmLLM/8dc567bdfa7fa514f1138725c1195261fc8aa041/firmcrawler/Examples/dlink/screenshot_5.png


--------------------------------------------------------------------------------
/firmcrawler/Examples/openwrt/screenshot_1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhang-xr/FirmLLM/8dc567bdfa7fa514f1138725c1195261fc8aa041/firmcrawler/Examples/openwrt/screenshot_1.png


--------------------------------------------------------------------------------
/firmcrawler/Examples/openwrt/screenshot_2.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhang-xr/FirmLLM/8dc567bdfa7fa514f1138725c1195261fc8aa041/firmcrawler/Examples/openwrt/screenshot_2.png


--------------------------------------------------------------------------------
/firmcrawler/Examples/openwrt/screenshot_3.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhang-xr/FirmLLM/8dc567bdfa7fa514f1138725c1195261fc8aa041/firmcrawler/Examples/openwrt/screenshot_3.png


--------------------------------------------------------------------------------
/firmcrawler/Examples/openwrt/screenshot_4.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhang-xr/FirmLLM/8dc567bdfa7fa514f1138725c1195261fc8aa041/firmcrawler/Examples/openwrt/screenshot_4.png


--------------------------------------------------------------------------------
/firmcrawler/Examples/openwrt/screenshot_5.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhang-xr/FirmLLM/8dc567bdfa7fa514f1138725c1195261fc8aa041/firmcrawler/Examples/openwrt/screenshot_5.png


--------------------------------------------------------------------------------
/firmcrawler/Examples/tp-link/screenshot_1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhang-xr/FirmLLM/8dc567bdfa7fa514f1138725c1195261fc8aa041/firmcrawler/Examples/tp-link/screenshot_1.png


--------------------------------------------------------------------------------
/firmcrawler/Examples/tp-link/screenshot_2.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhang-xr/FirmLLM/8dc567bdfa7fa514f1138725c1195261fc8aa041/firmcrawler/Examples/tp-link/screenshot_2.png


--------------------------------------------------------------------------------
/firmcrawler/Examples/tp-link/screenshot_3.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhang-xr/FirmLLM/8dc567bdfa7fa514f1138725c1195261fc8aa041/firmcrawler/Examples/tp-link/screenshot_3.png


--------------------------------------------------------------------------------
/firmcrawler/Examples/tp-link/screenshot_4.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhang-xr/FirmLLM/8dc567bdfa7fa514f1138725c1195261fc8aa041/firmcrawler/Examples/tp-link/screenshot_4.png


--------------------------------------------------------------------------------
/firmcrawler/Examples/tp-link/screenshot_5.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhang-xr/FirmLLM/8dc567bdfa7fa514f1138725c1195261fc8aa041/firmcrawler/Examples/tp-link/screenshot_5.png


--------------------------------------------------------------------------------
/firmcrawler/Examples/ui/screenshot_1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhang-xr/FirmLLM/8dc567bdfa7fa514f1138725c1195261fc8aa041/firmcrawler/Examples/ui/screenshot_1.png


--------------------------------------------------------------------------------
/firmcrawler/Examples/ui/screenshot_2.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhang-xr/FirmLLM/8dc567bdfa7fa514f1138725c1195261fc8aa041/firmcrawler/Examples/ui/screenshot_2.png


--------------------------------------------------------------------------------
/firmcrawler/Examples/ui/screenshot_3.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhang-xr/FirmLLM/8dc567bdfa7fa514f1138725c1195261fc8aa041/firmcrawler/Examples/ui/screenshot_3.png


--------------------------------------------------------------------------------
/firmcrawler/Examples/ui/screenshot_4.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhang-xr/FirmLLM/8dc567bdfa7fa514f1138725c1195261fc8aa041/firmcrawler/Examples/ui/screenshot_4.png


--------------------------------------------------------------------------------
/firmcrawler/Examples/ui/screenshot_5.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhang-xr/FirmLLM/8dc567bdfa7fa514f1138725c1195261fc8aa041/firmcrawler/Examples/ui/screenshot_5.png


--------------------------------------------------------------------------------
/firmcrawler/Examples/zyxel/navigation_links.jsonl:
--------------------------------------------------------------------------------
 1 | {"text": "", "url": "https://www.zyxel.com/us/en-us/products/switch/28-port-10gbe-l3-aggregation-switch-xs3800-28", "source_page": "https://selector.zyxel.com/"}
 2 | {"text": "", "url": "https://www.zyxel.com/us/en-us/products/switch/10-12-port-10g-multi-gigabit-lite-l3-smart-managed-switch-xs1930-series", "source_page": "https://selector.zyxel.com/"}
 3 | {"text": "", "url": "https://selector.zyxel.com/type/3", "source_page": "https://selector.zyxel.com/"}
 4 | {"text": "", "url": "https://selector.zyxel.com/type/4", "source_page": "https://selector.zyxel.com/"}
 5 | {"text": "", "url": "https://www.zyxel.com/us/en-us/products/switch/28-port-10gbe-l3-aggregation-switch-xs3800-28", "source_page": "https://selector.zyxel.com/"}
 6 | {"text": "", "url": "https://www.zyxel.com/us/en-us/products/switch/10-12-port-10g-multi-gigabit-lite-l3-smart-managed-switch-xs1930-series", "source_page": "https://selector.zyxel.com/"}
 7 | {"text": "", "url": "https://www.zyxel.com/global/en/products/switch/10-12-port-10g-multi-gigabit-lite-l3-smart-managed-switch-xs1930-series", "source_page": "https://selector.zyxel.com/"}
 8 | {"text": "", "url": "https://selector.zyxel.com/type/3", "source_page": "https://selector.zyxel.com/"}
 9 | {"text": "", "url": "https://selector.zyxel.com/type/4", "source_page": "https://selector.zyxel.com/"}
10 | {"text": "", "url": "https://www.zyxel.com/us/en-us/products/switch/28-port-10gbe-l3-aggregation-switch-xs3800-28", "source_page": "https://selector.zyxel.com/"}
11 | {"text": "", "url": "https://www.zyxel.com/us/en-us/products/switch/10-12-port-10g-multi-gigabit-lite-l3-smart-managed-switch-xs1930-series", "source_page": "https://selector.zyxel.com/"}
12 | {"text": "", "url": "https://www.zyxel.com/global/en/products/switch/10-12-port-10g-multi-gigabit-lite-l3-smart-managed-switch-xs1930-series", "source_page": "https://selector.zyxel.com/"}
13 | {"text": "", "url": "https://selector.zyxel.com/type/3", "source_page": "https://selector.zyxel.com/"}
14 | {"text": "", "url": "https://selector.zyxel.com/type/4", "source_page": "https://selector.zyxel.com/"}
15 | {"text": "", "url": "https://www.zyxel.com/us/en-us/products/switch/28-port-10gbe-l3-aggregation-switch-xs3800-28", "source_page": "https://selector.zyxel.com/"}
16 | {"text": "", "url": "https://www.zyxel.com/us/en-us/products/switch/10-12-port-10g-multi-gigabit-lite-l3-smart-managed-switch-xs1930-series", "source_page": "https://selector.zyxel.com/"}
17 | {"text": "", "url": "https://www.zyxel.com/global/en/products/switch/10-12-port-10g-multi-gigabit-lite-l3-smart-managed-switch-xs1930-series", "source_page": "https://selector.zyxel.com/"}
18 | 


--------------------------------------------------------------------------------
/firmcrawler/Examples/zyxel/screenshot_1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhang-xr/FirmLLM/8dc567bdfa7fa514f1138725c1195261fc8aa041/firmcrawler/Examples/zyxel/screenshot_1.png


--------------------------------------------------------------------------------
/firmcrawler/Examples/zyxel/screenshot_2.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhang-xr/FirmLLM/8dc567bdfa7fa514f1138725c1195261fc8aa041/firmcrawler/Examples/zyxel/screenshot_2.png


--------------------------------------------------------------------------------
/firmcrawler/Examples/zyxel/screenshot_3.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhang-xr/FirmLLM/8dc567bdfa7fa514f1138725c1195261fc8aa041/firmcrawler/Examples/zyxel/screenshot_3.png


--------------------------------------------------------------------------------
/firmcrawler/Examples/zyxel/screenshot_4.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhang-xr/FirmLLM/8dc567bdfa7fa514f1138725c1195261fc8aa041/firmcrawler/Examples/zyxel/screenshot_4.png


--------------------------------------------------------------------------------
/firmcrawler/Examples/zyxel/screenshot_5.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/zhang-xr/FirmLLM/8dc567bdfa7fa514f1138725c1195261fc8aa041/firmcrawler/Examples/zyxel/screenshot_5.png


--------------------------------------------------------------------------------
/firmcrawler/README.md:
--------------------------------------------------------------------------------
 1 | ```mermaid
 2 | sequenceDiagram
 3 |     participant User
 4 |     participant Controller
 5 |     participant Inspector
 6 |     participant Explorer
 7 |     participant Scraper
 8 |     
 9 |     User->>Controller: Input target website URL
10 |     Controller->>Inspector: Start page diagnosis
11 |     Inspector-->>Controller: Return SCRAPER/EXPLORER/ALL
12 |     alt SCRAPER mode
13 |         Controller->>Scraper: Execute deep data scraping
14 |         Scraper-->>User: Structured firmware dataset
15 |     else EXPLORER mode
16 |         Controller->>Explorer: Start URL mining
17 |         Explorer-->>Controller: Product URL list
18 |         Controller->>Inspector: Recursive diagnosis for each URL
19 |     else ALL mode
20 |         Controller->>Scraper: Launch data scraping in parallel
21 |         Controller->>Explorer: Synchronously start URL discovery
22 |     end
23 | ```


--------------------------------------------------------------------------------
/firmcrawler/callback.py:
--------------------------------------------------------------------------------
 1 | from langchain_core.callbacks import BaseCallbackHandler
 2 | from typing import Dict, Any
 3 | import json
 4 | class TokenUsageCallbackHandler(BaseCallbackHandler):
 5 |     def __init__(self, save_path):
 6 |         super().__init__()
 7 |         self.total_prompt_tokens = 0
 8 |         self.total_completion_tokens = 0
 9 |         self.total_cost = 0
10 |         self.save_path = save_path
11 |         
12 |     def on_llm_end(self, response: Any, **kwargs: Any) -> None:
13 |         try:
14 |             if hasattr(response, 'llm_output') and response.llm_output:
15 |                 token_usage = response.llm_output.get('token_usage', {})
16 |                 
17 |                 prompt_tokens = token_usage.get('prompt_tokens', 0)
18 |                 completion_tokens = token_usage.get('completion_tokens', 0)
19 |                 
20 |                 input_cost = prompt_tokens * (2.50 / 1_000_000)
21 |                 output_cost = completion_tokens * (10.00 / 1_000_000)
22 |                 
23 |                 self.total_prompt_tokens += prompt_tokens
24 |                 self.total_completion_tokens += completion_tokens
25 |                 self.total_cost += input_cost + output_cost
26 |                 
27 |                 print(f"\n📊 [Token Usage for this call]")
28 |                 print(f"Input tokens: {prompt_tokens:,} (${input_cost:.4f})")
29 |                 print(f"Output tokens: {completion_tokens:,} (${output_cost:.4f})")
30 |                 print(f"Total tokens: {prompt_tokens + completion_tokens:,}")
31 |                 print(f"Running total cost: ${self.total_cost:.4f}")
32 |                 with open(self.save_path, 'w') as f:
33 |                     json.dump({
34 |                         "total_prompt_tokens": self.total_prompt_tokens,
35 |                         "total_completion_tokens": self.total_completion_tokens,
36 |                         "total_cost": self.total_cost
37 |                     }, f)
38 |         except Exception as e:
39 |             print(f"Error in token usage calculation: {str(e)}")
40 |             print("Response structure:", dir(response))
41 |             if hasattr(response, 'llm_output'):
42 |                 print("LLM output:", response.llm_output)


--------------------------------------------------------------------------------
/firmcrawler/mark_page.js:
--------------------------------------------------------------------------------
  1 | const customCSS = `
  2 |         ::-webkit-scrollbar {
  3 |             width: 10px;
  4 |         }
  5 |         ::-webkit-scrollbar-track {
  6 |             background: #27272a;
  7 |         }
  8 |         ::-webkit-scrollbar-thumb {
  9 |             background: #888;
 10 |             border-radius: 0.375rem;
 11 |         }
 12 |         ::-webkit-scrollbar-thumb:hover {
 13 |             background: #555;
 14 |         }
 15 |     `;
 16 | 
 17 |     const styleTag = document.createElement("style");
 18 |     styleTag.textContent = customCSS;
 19 |     document.head.append(styleTag);
 20 | 
 21 |     let labels = [];
 22 | 
 23 |     function unmarkPage() {
 24 |     // Unmark page logic
 25 |     for (const label of labels) {
 26 |         document.body.removeChild(label);
 27 |     }
 28 |     labels = [];
 29 |     }
 30 | 
 31 |     function markPage() {
 32 |     unmarkPage();
 33 | 
 34 |     var bodyRect = document.body.getBoundingClientRect();
 35 | 
 36 |     var items = Array.prototype.slice
 37 |         .call(document.querySelectorAll("*"))
 38 |         .map(function (element) {
 39 |         var vw = Math.max(
 40 |             document.documentElement.clientWidth || 0,
 41 |             window.innerWidth || 0
 42 |         );
 43 |         var vh = Math.max(
 44 |             document.documentElement.clientHeight || 0,
 45 |             window.innerHeight || 0
 46 |         );
 47 |         var textualContent = element.textContent.trim().replace(/\s{2,}/g, " ");
 48 |         var elementType = element.tagName.toLowerCase();
 49 |         var ariaLabel = element.getAttribute("aria-label") || "";
 50 | 
 51 |         var rects = [...element.getClientRects()]
 52 |             .filter((bb) => {
 53 |             var center_x = bb.left + bb.width / 2;
 54 |             var center_y = bb.top + bb.height / 2;
 55 |             var elAtCenter = document.elementFromPoint(center_x, center_y);
 56 | 
 57 |             return elAtCenter === element || element.contains(elAtCenter);
 58 |             })
 59 |             .map((bb) => {
 60 |             const rect = {
 61 |                 left: Math.max(0, bb.left),
 62 |                 top: Math.max(0, bb.top),
 63 |                 right: Math.min(vw, bb.right),
 64 |                 bottom: Math.min(vh, bb.bottom),
 65 |             };
 66 |             return {
 67 |                 ...rect,
 68 |                 width: rect.right - rect.left,
 69 |                 height: rect.bottom - rect.top,
 70 |             };
 71 |             });
 72 | 
 73 |         var area = rects.reduce((acc, rect) => acc + rect.width * rect.height, 0);
 74 | 
 75 |         return {
 76 |             element: element,
 77 |             include:
 78 |             element.tagName === "SELECT" ||
 79 |             element.tagName === "BUTTON" ||
 80 |             element.tagName === "A" ||
 81 |             element.onclick != null ||
 82 |             window.getComputedStyle(element).cursor == "pointer" ||
 83 |             element.tagName === "IFRAME",
 84 |             area,
 85 |             rects,
 86 |             text: textualContent,
 87 |             type: elementType,
 88 |             ariaLabel: ariaLabel,
 89 |         };
 90 |         })
 91 |         .filter((item) => item.include && item.area >= 80);
 92 | 
 93 |     // Only keep inner clickable items
 94 |     items = items.filter(
 95 |         (x) => !items.some((y) => x.element.contains(y.element) && !(x == y))
 96 |     );
 97 |     // Color scheme to distinguish valid links and normal A tags
 98 |     const COLOR_SCHEME = {
 99 |         'a-link': "#FF4444",     // Valid links in red
100 |         'a': "#FFA07A",          // Normal A tags in light red
101 |         'button': "#4CAF50",     // Buttons in green
102 |         'select': "#9C27B0",     // Select boxes in purple
103 |         'iframe': "#2196F3",     // Iframes in blue
104 |         'clickable': "#FF9800",  // Other clickable elements in orange
105 |     };
106 |     // Modify color logic in items.forEach
107 |     items.forEach(function (item, index) {
108 |         item.rects.forEach((bbox) => {
109 |             newElement = document.createElement("div");
110 |             
111 |             // Get element type and color
112 |             const elementType = item.element.tagName.toLowerCase();
113 |             let borderColor;
114 |             
115 |             if (elementType === 'a') {
116 |                 // Check if it's a valid link
117 |                 const href = item.element.getAttribute('href');
118 |                 const isValidLink = href && href !== '#' && href !== '';
119 |                 borderColor = isValidLink ? COLOR_SCHEME['a-link'] : COLOR_SCHEME['a'];
120 |             } else {
121 |                 borderColor = COLOR_SCHEME[elementType] || 
122 |                              (item.element.onclick || window.getComputedStyle(item.element).cursor === "pointer" 
123 |                               ? COLOR_SCHEME.clickable 
124 |                               : "#757575");
125 |             }
126 |             
127 |             newElement.style.outline = `1px dashed ${borderColor}`;
128 |             newElement.style.position = "fixed";
129 |             newElement.style.left = bbox.left + "px";
130 |             newElement.style.top = bbox.top + "px";
131 |             newElement.style.width = bbox.width + "px";
132 |             newElement.style.height = bbox.height + "px";
133 |             newElement.style.pointerEvents = "none";
134 |             newElement.style.boxSizing = "border-box";
135 |             newElement.style.zIndex = 2147483647;
136 | 
137 |             // Use the same color for the label
138 |             var label = document.createElement("span");
139 |             label.textContent = index;
140 |             label.style.position = "absolute";
141 |             label.style.top = "-19px";
142 |             label.style.left = "0px";
143 |             label.style.background = borderColor;
144 |             label.style.color = "white";
145 |             label.style.padding = "2px 4px";
146 |             label.style.fontSize = "12px";
147 |             label.style.borderRadius = "2px";
148 |             newElement.appendChild(label);
149 | 
150 |             document.body.appendChild(newElement);
151 |             labels.push(newElement);
152 |         });
153 |     });
154 |     const coordinates = items.flatMap((item) =>
155 |         item.rects.map(({ left, top, width, height }) => ({
156 |         x: (left + left + width) / 2,
157 |         y: (top + top + height) / 2,
158 |         type: item.type,
159 |         text: item.text,
160 |         ariaLabel: item.ariaLabel,
161 |         }))
162 |     );
163 |     return coordinates;
164 |     }
165 | 


--------------------------------------------------------------------------------
/firmcrawler/prompts/dlink.yaml:
--------------------------------------------------------------------------------
  1 | inspector:
  2 |   user: |
  3 |     Workflow Examples:
  4 |     {{
  5 |         "thought": "Found direct firmware download links (.bin files) with version numbers",
  6 |         "action": "ANSWER SCRAPER",
  7 |         "status": "complete",
  8 |         "next_step": "Direct download links found, suitable for Scraper"
  9 |     }}
 10 |     {{
 11 |         "thought": "Page shows product list with 'Download' section for each, but needs additional navigation",
 12 |         "action": "ANSWER EXPLORER",
 13 |         "status": "complete",
 14 |         "next_step": "Multiple products with download sections need exploration"
 15 |     }}
 16 |     {{
 17 |         "thought": "Page contains both product info and firmware download section",
 18 |         "action": "ANSWER ALL",
 19 |         "status": "complete",
 20 |         "next_step": "Mixed content needs both Scraper and Explorer"
 21 |     }}
 22 |     {{
 23 |         "thought": "Found firmware table with version info but download links need verification",
 24 |         "action": "ANSWER ALL",
 25 |         "status": "complete",
 26 |         "next_step": "Firmware info present but needs further processing"
 27 |     }}
 28 |     {{
 29 |         "thought": "Page shows product specs with firmware update button",
 30 |         "action": "ANSWER ALL",
 31 |         "status": "complete",
 32 |         "next_step": "Contains both product info and firmware update option"
 33 |     }}
 34 |     {{
 35 |         "thought": "Download section visible but links go to selection page",
 36 |         "action": "ANSWER EXPLORER",
 37 |         "status": "complete",
 38 |         "next_step": "Downloads require further navigation"
 39 |     }}
 40 | 
 41 | # URL explorer - Collects product page URLs
 42 | explorer:
 43 |   user: |
 44 |     Workflow Examples:
 45 |     {{
 46 |         "thought": "Starting from page top, collecting initial viewport links",
 47 |         "action": "GET_NAVIGATION_LINKS 1,2,3,4,5",
 48 |         "status": "continue",
 49 |         "next_step": "After collecting initial links, scroll for more content"
 50 |     }}
 51 |     {{
 52 |         "thought": "Current viewport processed, scrolling down for more content",
 53 |         "action": "SCROLL WINDOW; down",
 54 |         "status": "continue",
 55 |         "next_step": "Wait for new content to load after scrolling"
 56 |     }}
 57 |     {{
 58 |         "thought": "Waiting for new content to load after scroll",
 59 |         "action": "WAIT 2",
 60 |         "status": "continue",
 61 |         "next_step": "Process newly visible links in viewport"
 62 |     }}
 63 |     {{
 64 |         "thought": "Processing next set of links in new viewport",
 65 |         "action": "GET_NAVIGATION_LINKS 6,7,8,9,10",
 66 |         "status": "continue",
 67 |         "next_step": "Check for more content by scrolling"
 68 |     }}
 69 |     {{
 70 |         "thought": "Scrolling to check for more content",
 71 |         "action": "SCROLL WINDOW; down",
 72 |         "status": "continue",
 73 |         "next_step": "Wait to verify if new content appears"
 74 |     }}
 75 |     {{
 76 |         "thought": "Waiting to verify no new content",
 77 |         "action": "WAIT 2",
 78 |         "status": "continue",
 79 |         "next_step": "Perform final scroll to confirm bottom"
 80 |     }}
 81 |     {{
 82 |         "thought": "Performing final scroll to confirm bottom reached",
 83 |         "action": "SCROLL WINDOW; down",
 84 |         "status": "continue",
 85 |         "next_step": "Wait for final verification"
 86 |     }}
 87 |     {{
 88 |         "thought": "Verification complete: Bottom reached, no new content, all links collected",
 89 |         "action": "ANSWER task completion status",
 90 |         "status": "complete",
 91 |         "next_step": "Task finished, all links collected"
 92 |     }}
 93 | scraper:
 94 |   user: |
 95 |     Note that you start from the top of the page, so no need to scroll up. Make sure to reach the bottom before submitting ANSWER.
 96 |     Begin scrolling down to load all content. Process each viewport systematically.
 97 | 
 98 |     Example workflow:
 99 |     {{
100 |         "thought": "Starting from page top, scanning for firmware download sections",
101 |         "action": "GET_NAVIGATION_LINKS 1,2,3",
102 |         "status": "continue",
103 |         "next_step": "After collecting current info, scroll down for more content"
104 |     }}
105 | 
106 |     {{
107 |         "thought": "Firmware info from current viewport collected, continuing down",
108 |         "action": "SCROLL WINDOW; down",
109 |         "status": "continue",
110 |         "next_step": "Process newly visible firmware info"
111 |     }}
112 | 
113 |     {{
114 |         "thought": "Reached page bottom, all firmware info collected",
115 |         "action": "ANSWER {collected_firmware_info}",
116 |         "status": "complete",
117 |         "next_step": "Task complete, all firmware info gathered"
118 |     }}
119 | 


--------------------------------------------------------------------------------
/firmcrawler/prompts/foscam.yaml:
--------------------------------------------------------------------------------
  1 | inspector:
  2 |   user: |
  3 |     Workflow Examples:
  4 |     {{
  5 |         "thought": "Found direct firmware download links (.bin files) with version numbers",
  6 |         "action": "ANSWER SCRAPER",
  7 |         "status": "complete",
  8 |         "next_step": "Direct download links found, suitable for Scraper"
  9 |     }}
 10 |     {{
 11 |         "thought": "Page shows product list with 'Download' section for each, but needs additional navigation",
 12 |         "action": "ANSWER EXPLORER",
 13 |         "status": "complete",
 14 |         "next_step": "Multiple products with download sections need exploration"
 15 |     }}
 16 |     {{
 17 |         "thought": "Page contains both product info and firmware download section",
 18 |         "action": "ANSWER ALL",
 19 |         "status": "complete",
 20 |         "next_step": "Mixed content needs both Scraper and Explorer"
 21 |     }}
 22 |     {{
 23 |         "thought": "Found firmware table with version info but download links need verification",
 24 |         "action": "ANSWER ALL",
 25 |         "status": "complete",
 26 |         "next_step": "Firmware info present but needs further processing"
 27 |     }}
 28 |     {{
 29 |         "thought": "Page shows product specs with firmware update button",
 30 |         "action": "ANSWER ALL",
 31 |         "status": "complete",
 32 |         "next_step": "Contains both product info and firmware update option"
 33 |     }}
 34 |     {{
 35 |         "thought": "Download section visible but links go to selection page",
 36 |         "action": "ANSWER EXPLORER",
 37 |         "status": "complete",
 38 |         "next_step": "Downloads require further navigation"
 39 |     }}
 40 | 
 41 | explorer:
 42 |   user: |
 43 |     Important Task Requirements:
 44 |     - Must scroll to top of page when entering any new page
 45 |     - Must process all product images and their corresponding navigation links
 46 |     - Must scroll to the absolute bottom of each page
 47 |     - Must perform multiple scroll verifications to confirm true bottom is reached
 48 |     - Must ONLY click "Next Page" button (NEVER click "Previous Page")
 49 |     - Must process pages in forward order only (from first page to last page)
 50 |     - Must process content from top to bottom on each page
 51 |     - Only complete task after confirming no more content and no next page exists
 52 |     
 53 |     Workflow Examples:
 54 |     {{
 55 |         "thought": "Start by ensuring we're at the top of the page",
 56 |         "action": "SCROLL WINDOW; up",
 57 |         "status": "continue",
 58 |         "next_step": "Begin processing from page top"
 59 |     }}
 60 |     {{
 61 |         "thought": "Start scrolling down to load initial content",
 62 |         "action": "SCROLL WINDOW; down",
 63 |         "status": "continue",
 64 |         "next_step": "Wait for content to load then collect first set of product links"
 65 |     }}
 66 |     {{
 67 |         "thought": "Processing first group of product images and their navigation links",
 68 |         "action": "GET_NAVIGATION_LINKS 1,2,3,4,5",
 69 |         "status": "continue",
 70 |         "next_step": "Scroll down to check for more products"
 71 |     }}
 72 |     {{
 73 |         "thought": "More products visible, scroll to load them completely",
 74 |         "action": "SCROLL WINDOW; down",
 75 |         "status": "continue",
 76 |         "next_step": "Process next group of product links"
 77 |     }}
 78 |     {{
 79 |         "thought": "Getting next set of product navigation links",
 80 |         "action": "GET_NAVIGATION_LINKS 6,7,8,9,10",
 81 |         "status": "continue",
 82 |         "next_step": "Continue scrolling to check for more content"
 83 |     }}
 84 |     {{
 85 |         "thought": "Scroll to check for more content and next page button",
 86 |         "action": "SCROLL WINDOW; down",
 87 |         "status": "continue",
 88 |         "next_step": "Verify if next page exists"
 89 |     }}
 90 |     {{
 91 |         "thought": "Found next page button (element 11), verifying it's 'Next' not 'Previous'",
 92 |         "action": "VERIFY_TEXT 11 'next'",
 93 |         "status": "continue",
 94 |         "next_step": "Click next page if verified"
 95 |     }}
 96 |     {{
 97 |         "thought": "Confirmed it's next page button, clicking to proceed",
 98 |         "action": "CLICK 11",
 99 |         "status": "continue",
100 |         "next_step": "Wait for new page to load then scroll to top"
101 |     }}
102 |     {{
103 |         "thought": "New page loaded, scrolling back to top before processing",
104 |         "action": "SCROLL WINDOW; up",
105 |         "status": "continue",
106 |         "next_step": "Begin processing new page from top"
107 |     }}
108 |     {{
109 |         "thought": "No next page found, performing additional scroll to verify bottom",
110 |         "action": "SCROLL WINDOW; down",
111 |         "status": "continue",
112 |         "next_step": "Double check we reached true bottom"
113 |     }}
114 |     {{
115 |         "thought": "Performing final verification scroll",
116 |         "action": "SCROLL WINDOW; down",
117 |         "status": "continue",
118 |         "next_step": "Confirm no more content or next page button"
119 |     }}
120 |     {{
121 |         "thought": "Multiple scrolls confirm true bottom reached, no next page found",
122 |         "action": "ANSWER All pages processed successfully, confirmed no more content",
123 |         "status": "complete",
124 |         "next_step": "Task complete, collected all product links from all pages"
125 |     }}
126 | scraper:
127 |   user: |
128 |     Note that you start from the top of the page, so no need to scroll up. Make sure to reach the bottom before submitting ANSWER.
129 |     Begin scrolling down to load all content. Process each viewport systematically.
130 | 
131 |     Example workflow:
132 |     {{
133 |         "thought": "Starting from page top, scanning for firmware download sections",
134 |         "action": "GET_NAVIGATION_LINKS 1,2,3",
135 |         "status": "continue",
136 |         "next_step": "After collecting current info, scroll down for more content"
137 |     }}
138 | 
139 |     {{
140 |         "thought": "Firmware info from current viewport collected, continuing down",
141 |         "action": "SCROLL WINDOW; down",
142 |         "status": "continue",
143 |         "next_step": "Process newly visible firmware info"
144 |     }}
145 | 
146 |     {{
147 |         "thought": "Reached page bottom, all firmware info collected",
148 |         "action": "ANSWER {collected_firmware_info}",
149 |         "status": "complete",
150 |         "next_step": "Task complete, all firmware info gathered"
151 |     }}
152 | 


--------------------------------------------------------------------------------
/firmcrawler/prompts/ui.yaml:
--------------------------------------------------------------------------------
  1 | inspector:
  2 |   user: |
  3 |     Workflow Examples:
  4 |     {{
  5 |         "thought": "Found direct firmware download links (.bin files) with version numbers",
  6 |         "action": "ANSWER SCRAPER",
  7 |         "status": "complete",
  8 |         "next_step": "Direct download links found, suitable for Scraper"
  9 |     }}
 10 |     {{
 11 |         "thought": "Page shows product list with 'Download' section for each, but needs additional navigation",
 12 |         "action": "ANSWER EXPLORER",
 13 |         "status": "complete",
 14 |         "next_step": "Multiple products with download sections need exploration"
 15 |     }}
 16 |     {{
 17 |         "thought": "Page contains both product info and firmware download section",
 18 |         "action": "ANSWER ALL",
 19 |         "status": "complete",
 20 |         "next_step": "Mixed content needs both Scraper and Explorer"
 21 |     }}
 22 |     {{
 23 |         "thought": "Found firmware table with version info but download links need verification",
 24 |         "action": "ANSWER ALL",
 25 |         "status": "complete",
 26 |         "next_step": "Firmware info present but needs further processing"
 27 |     }}
 28 |     {{
 29 |         "thought": "Page shows product specs with firmware update button",
 30 |         "action": "ANSWER ALL",
 31 |         "status": "complete",
 32 |         "next_step": "Contains both product info and firmware update option"
 33 |     }}
 34 |     {{
 35 |         "thought": "Download section visible but links go to selection page",
 36 |         "action": "ANSWER EXPLORER",
 37 |         "status": "complete",
 38 |         "next_step": "Downloads require further navigation"
 39 |     }}
 40 | explorer:
 41 |   user: |
 42 |     Workflow Examples:
 43 |     {{
 44 |         "thought": "Start scrolling down to load all content",
 45 |         "action": "SCROLL WINDOW; down",
 46 |         "status": "continue",
 47 |         "next_step": "Check for initial viewport links after scrolling"
 48 |     }}
 49 |     {{
 50 |         "thought": "Starting from page top, collect initial viewport links",
 51 |         "action": "GET_NAVIGATION_LINKS 1,2,3,4,5",
 52 |         "status": "continue",
 53 |         "next_step": "After collecting links, scroll for more content"
 54 |     }}
 55 |     {{
 56 |         "thought": "Current viewport processed, scroll down to see more content",
 57 |         "action": "SCROLL WINDOW; down",
 58 |         "status": "continue",
 59 |         "next_step": "Wait for new content to load"
 60 |     }}
 61 |     {{
 62 |         "thought": "Process next group of links in new viewport",
 63 |         "action": "GET_NAVIGATION_LINKS 6,7,8,9,10",
 64 |         "status": "continue",
 65 |         "next_step": "Check for more content by scrolling"
 66 |     }}
 67 |     {{
 68 |         "thought": "Scroll to check for more content",
 69 |         "action": "SCROLL WINDOW; down",
 70 |         "status": "continue",
 71 |         "next_step": "Wait to verify if new content appears"
 72 |     }}
 73 |     {{
 74 |         "thought": "Perform final scroll to confirm bottom reached",
 75 |         "action": "SCROLL WINDOW; down",
 76 |         "status": "continue",
 77 |         "next_step": "Verify all content processed"
 78 |     }}
 79 |     {{
 80 |         "thought": "Verification complete: reached bottom, no new content, all links collected",
 81 |         "action": "ANSWER Task completed",
 82 |         "status": "complete",
 83 |         "next_step": "Task finished, all links collected"
 84 |     }}
 85 | 
 86 | scraper:
 87 |   user: |
 88 |     Note that you start from the top of the page, so no need to scroll up. Make sure to reach the bottom before submitting ANSWER.
 89 |     Begin scrolling down to load all content. Process each viewport systematically.
 90 | 
 91 |     Example workflow:
 92 |     {{
 93 |         "thought": "Starting from page top, scanning for firmware download sections",
 94 |         "action": "GET_NAVIGATION_LINKS 1,2,3",
 95 |         "status": "continue",
 96 |         "next_step": "After collecting current info, scroll down for more content"
 97 |     }}
 98 | 
 99 |     {{
100 |         "thought": "Firmware info from current viewport collected, continuing down",
101 |         "action": "SCROLL WINDOW; down",
102 |         "status": "continue",
103 |         "next_step": "Process newly visible firmware info"
104 |     }}
105 | 
106 |     {{
107 |         "thought": "Reached page bottom, all firmware info collected",
108 |         "action": "ANSWER {collected_firmware_info}",
109 |         "status": "complete",
110 |         "next_step": "Task complete, all firmware info gathered"
111 |     }}
112 | 


--------------------------------------------------------------------------------