Add files via upload

2026-02-12 14:02:45 +00:00 · 2026-01-14 15:58:19 -03:00
parent 866bb455d7
commit 4b9b0d22be
20 changed files with 76469 additions and 307 deletions
--- a/core/context_builder.py
+++ b/core/context_builder.py
@@ -0,0 +1,468 @@
+#!/usr/bin/env python3
+"""
+Context Builder - Consolidates all recon outputs into a single file for LLM consumption
+
+This module aggregates results from all reconnaissance tools into a single
+consolidated file that will be used by the LLM to enhance testing capabilities.
+"""
+
+import json
+import os
+from datetime import datetime
+from pathlib import Path
+from typing import Dict, List, Any, Set, Optional
+from urllib.parse import urlparse
+import logging
+
+logger = logging.getLogger(__name__)
+
+
+class ReconContextBuilder:
+    """
+    Consolidates all reconnaissance data into a single context for LLM consumption.
+
+    Generates consolidated files:
+    - consolidated_context.json - Complete JSON with all data
+    - consolidated_context.txt - Text version for direct LLM consumption
+    """
+
+    def __init__(self, output_dir: str = "results"):
+        """Initialize the builder."""
+        self.output_dir = Path(output_dir)
+        self.output_dir.mkdir(parents=True, exist_ok=True)
+
+        # Collected data
+        self.target_info: Dict[str, Any] = {}
+        self.subdomains: Set[str] = set()
+        self.live_hosts: Set[str] = set()
+        self.urls: Set[str] = set()
+        self.urls_with_params: Set[str] = set()
+        self.open_ports: List[Dict] = []
+        self.technologies: List[str] = []
+        self.vulnerabilities: List[Dict] = []
+        self.dns_records: List[str] = []
+        self.js_files: Set[str] = set()
+        self.api_endpoints: Set[str] = set()
+        self.interesting_paths: Set[str] = set()
+        self.secrets: List[str] = []
+        self.raw_outputs: Dict[str, str] = {}
+        self.tool_results: Dict[str, Dict] = {}
+
+    def set_target(self, target: str, target_type: str = "domain"):
+        """Set the primary target."""
+        self.target_info = {
+            "primary_target": target,
+            "type": target_type,
+            "timestamp": datetime.now().isoformat()
+        }
+
+        # Auto-add as in-scope
+        if target_type == "domain":
+            self.subdomains.add(target)
+        elif target_type == "url":
+            parsed = urlparse(target)
+            if parsed.netloc:
+                self.subdomains.add(parsed.netloc)
+                self.live_hosts.add(target)
+
+    def add_subdomains(self, subdomains: List[str]):
+        """Add discovered subdomains."""
+        for sub in subdomains:
+            sub = sub.strip().lower()
+            if sub and self._is_valid_domain(sub):
+                self.subdomains.add(sub)
+
+    def add_live_hosts(self, hosts: List[str]):
+        """Add active HTTP hosts."""
+        for host in hosts:
+            host = host.strip()
+            if host:
+                self.live_hosts.add(host)
+
+    def add_urls(self, urls: List[str]):
+        """Add discovered URLs."""
+        for url in urls:
+            url = url.strip()
+            if url and url.startswith(('http://', 'https://')):
+                self.urls.add(url)
+                # Separate URLs with parameters
+                if '?' in url and '=' in url:
+                    self.urls_with_params.add(url)
+
+    def add_open_ports(self, ports: List[Dict]):
+        """Add discovered open ports."""
+        for port in ports:
+            if port not in self.open_ports:
+                self.open_ports.append(port)
+
+    def add_technologies(self, techs: List[str]):
+        """Add detected technologies."""
+        for tech in techs:
+            if tech and tech not in self.technologies:
+                self.technologies.append(tech)
+
+    def add_vulnerabilities(self, vulns: List[Dict]):
+        """Add found vulnerabilities."""
+        for vuln in vulns:
+            if vuln not in self.vulnerabilities:
+                self.vulnerabilities.append(vuln)
+
+    def add_dns_records(self, records: List[str]):
+        """Add DNS records."""
+        for record in records:
+            if record and record not in self.dns_records:
+                self.dns_records.append(record)
+
+    def add_js_files(self, js_urls: List[str]):
+        """Add found JavaScript files."""
+        for js in js_urls:
+            if js and '.js' in js.lower():
+                self.js_files.add(js)
+
+    def add_api_endpoints(self, endpoints: List[str]):
+        """Add API endpoints."""
+        for ep in endpoints:
+            if ep:
+                self.api_endpoints.add(ep)
+
+    def add_interesting_paths(self, paths: List[str]):
+        """Add interesting paths."""
+        keywords = ['admin', 'login', 'dashboard', 'api', 'config', 'backup',
+                   'debug', 'test', 'dev', 'staging', 'internal', 'upload',
+                   'console', 'panel', 'phpinfo', 'swagger', '.git', '.env']
+
+        for path in paths:
+            path_lower = path.lower()
+            if any(kw in path_lower for kw in keywords):
+                self.interesting_paths.add(path)
+
+    def add_secrets(self, secrets: List[str]):
+        """Add potential secrets found."""
+        for secret in secrets:
+            if secret and secret not in self.secrets:
+                self.secrets.append(secret)
+
+    def add_raw_output(self, tool_name: str, output: str):
+        """Add raw output from a tool."""
+        self.raw_outputs[tool_name] = output
+
+    def add_tool_result(self, tool_name: str, result: Dict):
+        """Add structured result from a tool."""
+        self.tool_results[tool_name] = result
+
+    def _is_valid_domain(self, domain: str) -> bool:
+        """Check if it's a valid domain."""
+        if not domain or '..' in domain or domain.startswith('.'):
+            return False
+        parts = domain.split('.')
+        return len(parts) >= 2 and all(p for p in parts)
+
+    def _extract_params_from_urls(self) -> Dict[str, List[str]]:
+        """Extract unique parameters from URLs."""
+        params = {}
+        for url in self.urls_with_params:
+            if '?' in url:
+                query = url.split('?')[1]
+                for pair in query.split('&'):
+                    if '=' in pair:
+                        param_name = pair.split('=')[0]
+                        if param_name not in params:
+                            params[param_name] = []
+                        params[param_name].append(url)
+        return params
+
+    def _categorize_vulnerabilities(self) -> Dict[str, List[Dict]]:
+        """Categorize vulnerabilities by severity."""
+        categories = {
+            'critical': [],
+            'high': [],
+            'medium': [],
+            'low': [],
+            'info': []
+        }
+
+        for vuln in self.vulnerabilities:
+            severity = vuln.get('severity', 'info').lower()
+            if severity in categories:
+                categories[severity].append(vuln)
+
+        return categories
+
+    def _build_attack_surface(self) -> Dict[str, Any]:
+        """Build attack surface summary."""
+        return {
+            "total_subdomains": len(self.subdomains),
+            "live_hosts": len(self.live_hosts),
+            "total_urls": len(self.urls),
+            "urls_with_params": len(self.urls_with_params),
+            "open_ports": len(self.open_ports),
+            "js_files": len(self.js_files),
+            "api_endpoints": len(self.api_endpoints),
+            "interesting_paths": len(self.interesting_paths),
+            "technologies_detected": len(self.technologies),
+            "vulnerabilities_found": len(self.vulnerabilities),
+            "secrets_found": len(self.secrets)
+        }
+
+    def _build_recommendations(self) -> List[str]:
+        """Generate recommendations based on findings."""
+        recs = []
+
+        vuln_cats = self._categorize_vulnerabilities()
+
+        if vuln_cats['critical']:
+            recs.append(f"CRITICAL: {len(vuln_cats['critical'])} critical vulnerabilities found - immediate action required!")
+
+        if vuln_cats['high']:
+            recs.append(f"HIGH: {len(vuln_cats['high'])} high severity vulnerabilities need attention.")
+
+        if self.urls_with_params:
+            recs.append(f"Test {len(self.urls_with_params)} URLs with parameters for SQLi, XSS, etc.")
+
+        if self.api_endpoints:
+            recs.append(f"Review {len(self.api_endpoints)} API endpoints for authentication/authorization issues.")
+
+        if self.secrets:
+            recs.append(f"SECRETS: {len(self.secrets)} potential secrets exposed - rotate credentials!")
+
+        if self.interesting_paths:
+            recs.append(f"Investigate {len(self.interesting_paths)} interesting paths found.")
+
+        if len(self.live_hosts) > 50:
+            recs.append("Large attack surface detected - consider network segmentation.")
+
+        return recs
+
+    def build(self) -> Dict[str, Any]:
+        """Build the consolidated context."""
+        logger.info("Building consolidated context for LLM...")
+
+        context = {
+            "metadata": {
+                "generated_at": datetime.now().isoformat(),
+                "generator": "NeuroSploit Recon",
+                "version": "2.0.0"
+            },
+            "target": self.target_info,
+            "attack_surface": self._build_attack_surface(),
+            "data": {
+                "subdomains": sorted(list(self.subdomains)),
+                "live_hosts": sorted(list(self.live_hosts)),
+                "urls": {
+                    "all": list(self.urls)[:500],
+                    "with_params": list(self.urls_with_params),
+                    "total_count": len(self.urls)
+                },
+                "open_ports": self.open_ports,
+                "technologies": self.technologies,
+                "dns_records": self.dns_records,
+                "js_files": list(self.js_files),
+                "api_endpoints": list(self.api_endpoints),
+                "interesting_paths": list(self.interesting_paths),
+                "unique_params": self._extract_params_from_urls(),
+                "secrets": self.secrets[:50]
+            },
+            "vulnerabilities": {
+                "total": len(self.vulnerabilities),
+                "by_severity": self._categorize_vulnerabilities(),
+                "all": self.vulnerabilities[:100]
+            },
+            "recommendations": self._build_recommendations(),
+            "tool_results": self.tool_results
+        }
+
+        return context
+
+    def build_text_context(self) -> str:
+        """Build context in text format for LLM."""
+        ctx = self.build()
+
+        lines = [
+            "=" * 80,
+            "NEUROSPLOIT - CONSOLIDATED RECONNAISSANCE CONTEXT",
+            "=" * 80,
+            "",
+            f"Primary Target: {ctx['target'].get('primary_target', 'N/A')}",
+            f"Generated at: {ctx['metadata']['generated_at']}",
+            "",
+            "-" * 40,
+            "ATTACK SURFACE",
+            "-" * 40,
+        ]
+
+        for key, value in ctx['attack_surface'].items():
+            lines.append(f"  {key}: {value}")
+
+        lines.extend([
+            "",
+            "-" * 40,
+            "DISCOVERED SUBDOMAINS",
+            "-" * 40,
+        ])
+        for sub in ctx['data']['subdomains'][:50]:
+            lines.append(f"  - {sub}")
+        if len(ctx['data']['subdomains']) > 50:
+            lines.append(f"  ... and {len(ctx['data']['subdomains']) - 50} more")
+
+        lines.extend([
+            "",
+            "-" * 40,
+            "LIVE HOSTS (HTTP)",
+            "-" * 40,
+        ])
+        for host in ctx['data']['live_hosts'][:30]:
+            lines.append(f"  - {host}")
+
+        lines.extend([
+            "",
+            "-" * 40,
+            "OPEN PORTS",
+            "-" * 40,
+        ])
+        for port in ctx['data']['open_ports'][:30]:
+            lines.append(f"  - {port.get('port', 'N/A')}/{port.get('protocol', 'tcp')} - {port.get('service', 'unknown')}")
+
+        lines.extend([
+            "",
+            "-" * 40,
+            "DETECTED TECHNOLOGIES",
+            "-" * 40,
+        ])
+        for tech in ctx['data']['technologies'][:20]:
+            lines.append(f"  - {tech}")
+
+        lines.extend([
+            "",
+            "-" * 40,
+            "URLs WITH PARAMETERS (for injection testing)",
+            "-" * 40,
+        ])
+        for url in ctx['data']['urls']['with_params'][:50]:
+            lines.append(f"  - {url}")
+
+        lines.extend([
+            "",
+            "-" * 40,
+            "API ENDPOINTS",
+            "-" * 40,
+        ])
+        for ep in ctx['data']['api_endpoints']:
+            lines.append(f"  - {ep}")
+
+        lines.extend([
+            "",
+            "-" * 40,
+            "INTERESTING PATHS",
+            "-" * 40,
+        ])
+        for path in ctx['data']['interesting_paths']:
+            lines.append(f"  - {path}")
+
+        lines.extend([
+            "",
+            "-" * 40,
+            "VULNERABILITIES FOUND",
+            "-" * 40,
+            f"Total: {ctx['vulnerabilities']['total']}",
+            f"Critical: {len(ctx['vulnerabilities']['by_severity']['critical'])}",
+            f"High: {len(ctx['vulnerabilities']['by_severity']['high'])}",
+            f"Medium: {len(ctx['vulnerabilities']['by_severity']['medium'])}",
+            f"Low: {len(ctx['vulnerabilities']['by_severity']['low'])}",
+            "",
+        ])
+
+        for vuln in ctx['vulnerabilities']['all'][:30]:
+            lines.append(f"  [{vuln.get('severity', 'INFO').upper()}] {vuln.get('title', 'N/A')}")
+            lines.append(f"       Endpoint: {vuln.get('affected_endpoint', 'N/A')}")
+
+        if ctx['data']['secrets']:
+            lines.extend([
+                "",
+                "-" * 40,
+                "POTENTIAL EXPOSED SECRETS",
+                "-" * 40,
+            ])
+            for secret in ctx['data']['secrets'][:20]:
+                lines.append(f"  [!] {secret[:100]}")
+
+        lines.extend([
+            "",
+            "-" * 40,
+            "RECOMMENDATIONS FOR LLM",
+            "-" * 40,
+        ])
+        for rec in ctx['recommendations']:
+            lines.append(f"  * {rec}")
+
+        lines.extend([
+            "",
+            "=" * 80,
+            "END OF CONTEXT - USE THIS DATA TO ENHANCE TESTING",
+            "=" * 80,
+        ])
+
+        return "\n".join(lines)
+
+    def save(self, session_id: str = None) -> Dict[str, Path]:
+        """Save the consolidated context to files."""
+        if not session_id:
+            session_id = datetime.now().strftime("%Y%m%d_%H%M%S")
+
+        # Paths
+        json_path = self.output_dir / f"context_{session_id}.json"
+        txt_path = self.output_dir / f"context_{session_id}.txt"
+
+        # Build and save JSON
+        context = self.build()
+        with open(json_path, 'w') as f:
+            json.dump(context, f, indent=2, default=str)
+
+        # Build and save TXT
+        text_context = self.build_text_context()
+        with open(txt_path, 'w') as f:
+            f.write(text_context)
+
+        logger.info(f"Context saved to: {json_path} and {txt_path}")
+
+        return {
+            "json": json_path,
+            "txt": txt_path,
+            "context": context
+        }
+
+    def get_llm_prompt_context(self) -> str:
+        """Return context formatted for inclusion in LLM prompt."""
+        return self.build_text_context()
+
+
+def load_context_from_file(context_file: str) -> Optional[Dict]:
+    """Load recon context from a JSON file."""
+    try:
+        with open(context_file, 'r') as f:
+            return json.load(f)
+    except Exception as e:
+        logger.error(f"Error loading context: {e}")
+        return None
+
+
+def merge_contexts(contexts: List[Dict]) -> Dict:
+    """Merge multiple recon contexts into one."""
+    merged = ReconContextBuilder()
+
+    for ctx in contexts:
+        data = ctx.get('data', {})
+
+        merged.add_subdomains(data.get('subdomains', []))
+        merged.add_live_hosts(data.get('live_hosts', []))
+        merged.add_urls(data.get('urls', {}).get('all', []))
+        merged.add_open_ports(data.get('open_ports', []))
+        merged.add_technologies(data.get('technologies', []))
+        merged.add_dns_records(data.get('dns_records', []))
+        merged.add_js_files(data.get('js_files', []))
+        merged.add_api_endpoints(data.get('api_endpoints', []))
+        merged.add_secrets(data.get('secrets', []))
+
+        for vuln in ctx.get('vulnerabilities', {}).get('all', []):
+            merged.add_vulnerabilities([vuln])
+
+    return merged.build()
--- a/core/pentest_executor.py
+++ b/core/pentest_executor.py
@@ -54,15 +54,137 @@ class ScanResult:
 class PentestExecutor:
    """Executes real pentest tools and captures outputs"""

-    def __init__(self, target: str, config: Dict = None):
+    def __init__(self, target: str, config: Dict = None, recon_context: Dict = None):
        self.target = self._normalize_target(target)
        self.config = config or {}
+        self.recon_context = recon_context  # Contexto consolidado do recon
        self.scan_result = ScanResult(
            target=self.target,
            scan_started=datetime.now().isoformat()
        )
        self.timeout = 300  # 5 minutes default timeout

+        # Se tiver contexto de recon, pre-popula dados
+        if self.recon_context:
+            self._load_from_recon_context()
+
+    def _load_from_recon_context(self):
+        """Carrega dados do contexto de recon consolidado."""
+        if not self.recon_context:
+            return
+
+        data = self.recon_context.get('data', {})
+
+        # Carrega tecnologias detectadas
+        techs = data.get('technologies', [])
+        self.scan_result.technologies.extend(techs)
+
+        # Carrega portas abertas
+        ports = data.get('open_ports', [])
+        for port in ports:
+            if port not in self.scan_result.open_ports:
+                self.scan_result.open_ports.append(port)
+
+        # Carrega vulnerabilidades ja encontradas
+        vulns = self.recon_context.get('vulnerabilities', {}).get('all', [])
+        for v in vulns:
+            vuln = Vulnerability(
+                title=v.get('title', v.get('name', 'Unknown')),
+                severity=v.get('severity', 'Info').capitalize(),
+                cvss_score=self._severity_to_cvss(v.get('severity', 'info')),
+                cvss_vector="",
+                description=v.get('description', ''),
+                affected_endpoint=v.get('affected_endpoint', v.get('url', self.target)),
+                impact=f"{v.get('severity', 'info')} severity vulnerability",
+                poc_request=v.get('curl_command', ''),
+                poc_response="",
+                poc_payload="",
+                remediation="Apply vendor patches and security best practices"
+            )
+            self.scan_result.vulnerabilities.append(vuln)
+
+        logger.info(f"Carregados do recon: {len(techs)} techs, {len(ports)} portas, {len(vulns)} vulns")
+
+    @classmethod
+    def load_context_from_file(cls, context_file: str) -> Optional[Dict]:
+        """Carrega contexto de recon de um arquivo JSON."""
+        try:
+            with open(context_file, 'r') as f:
+                return json.load(f)
+        except Exception as e:
+            logger.error(f"Erro ao carregar contexto: {e}")
+            return None
+
+    def get_urls_with_params(self) -> List[str]:
+        """Retorna URLs com parametros do contexto para testes de injecao."""
+        if not self.recon_context:
+            return []
+
+        data = self.recon_context.get('data', {})
+        urls = data.get('urls', {})
+
+        if isinstance(urls, dict):
+            return urls.get('with_params', [])
+        return []
+
+    def get_api_endpoints(self) -> List[str]:
+        """Retorna endpoints de API do contexto."""
+        if not self.recon_context:
+            return []
+
+        data = self.recon_context.get('data', {})
+        return data.get('api_endpoints', [])
+
+    def get_interesting_paths(self) -> List[str]:
+        """Retorna caminhos interessantes do contexto."""
+        if not self.recon_context:
+            return []
+
+        data = self.recon_context.get('data', {})
+        return data.get('interesting_paths', [])
+
+    def get_live_hosts(self) -> List[str]:
+        """Retorna hosts ativos do contexto."""
+        if not self.recon_context:
+            return []
+
+        data = self.recon_context.get('data', {})
+        return data.get('live_hosts', [])
+
+    def get_context_for_llm(self) -> str:
+        """Retorna o contexto formatado para incluir no prompt do LLM."""
+        if not self.recon_context:
+            return ""
+
+        lines = [
+            "=== CONTEXTO DE RECON CONSOLIDADO ===",
+            f"Alvo: {self.recon_context.get('target', {}).get('primary_target', 'N/A')}",
+            "",
+            "SUPERFICIE DE ATAQUE:",
+        ]
+
+        attack_surface = self.recon_context.get('attack_surface', {})
+        for key, value in attack_surface.items():
+            lines.append(f"  - {key}: {value}")
+
+        lines.append("\nTECNOLOGIAS DETECTADAS:")
+        for tech in self.scan_result.technologies[:10]:
+            lines.append(f"  - {tech}")
+
+        lines.append("\nURLs COM PARAMETROS (para testes de injecao):")
+        for url in self.get_urls_with_params()[:20]:
+            lines.append(f"  - {url}")
+
+        lines.append("\nENDPOINTS DE API:")
+        for ep in self.get_api_endpoints()[:10]:
+            lines.append(f"  - {ep}")
+
+        lines.append("\nVULNERABILIDADES JA ENCONTRADAS:")
+        for vuln in self.scan_result.vulnerabilities[:10]:
+            lines.append(f"  - [{vuln.severity}] {vuln.title}")
+
+        return "\n".join(lines)
+
    def _normalize_target(self, target: str) -> str:
        """Normalize target URL/IP"""
        target = target.strip()