# Source: cyber_llm/src/agents/safety_agent.py
# Commit 23804b3 ("Upload core Cyber-LLM platform components"), uploaded by unit731; file size 21.1 kB.
"""
SafetyAgent: OPSEC Compliance and Safety Validation Agent
Validates operations for OPSEC compliance and safety considerations.
"""
import json
import logging
import re
from typing import Dict, List, Optional, Any, Tuple
from dataclasses import dataclass
from pathlib import Path
from enum import Enum
class RiskLevel(Enum):
    """Severity levels assigned to individual checks and to the overall assessment.

    The string values are what gets compared against the
    ``require_human_approval`` configuration list and printed in summaries.
    Members are plain ``Enum`` values and are therefore not orderable with
    ``<`` / ``>``; rank them through an explicit score mapping instead.
    """

    LOW = "low"
    MEDIUM = "medium"
    HIGH = "high"
    CRITICAL = "critical"
@dataclass
class SafetyCheck:
    """Result of a single safety check.

    Attributes:
        check_name: Human-readable name of the check.
        risk_level: Risk level the check assigned to the inspected commands.
        description: Short description of the check's outcome.
        violations: Messages describing each problem the check found.
        recommendations: Suggested mitigations; empty when nothing was flagged.
    """

    check_name: str
    risk_level: RiskLevel
    description: str
    violations: List[str]
    recommendations: List[str]
@dataclass
class SafetyAssessment:
    """Complete safety assessment result.

    Attributes:
        overall_risk: Risk level aggregated over all individual checks.
        checks: The individual check results the assessment is based on.
        approved: Whether the commands were approved.
        summary: Multi-line, human-readable summary text.
        safe_alternatives: Safer suggestions; empty when the commands were
            approved.
    """

    overall_risk: RiskLevel
    checks: List[SafetyCheck]
    approved: bool
    summary: str
    safe_alternatives: List[str]
class SafetyAgent:
    """Advanced safety and OPSEC compliance validation agent.

    The agent inspects command strings with regular expressions, runs five
    independent checks (detection risk, OPSEC compliance, timing,
    infrastructure safety, target appropriateness), aggregates their risk
    levels and decides whether the command set is approved.
    """

    def __init__(self, config_path: Optional[Path] = None):
        """Create an agent.

        Args:
            config_path: Optional path to a JSON file whose keys override the
                built-in default configuration.
        """
        self.logger = logging.getLogger(__name__)
        self.config = self._load_config(config_path)
        self.opsec_rules = self._load_opsec_rules()
        self.risk_patterns = self._load_risk_patterns()

    def _load_config(self, config_path: Optional[Path]) -> Dict:
        """Load safety agent configuration.

        Args:
            config_path: Optional path to a JSON file. When it is given and
                exists, its top-level keys override the defaults.

        Returns:
            The effective configuration dictionary.
        """
        default_config = {
            'strict_mode': True,
            'auto_approve_low_risk': False,
            'require_human_approval': ['high', 'critical'],
            'logging_level': 'INFO',
            'detection_threshold': 0.7
        }
        if config_path and config_path.exists():
            # JSON text is UTF-8; do not depend on the platform default encoding.
            with open(config_path, 'r', encoding='utf-8') as f:
                user_config = json.load(f)
            default_config.update(user_config)
        return default_config

    def _load_opsec_rules(self) -> Dict:
        """Load OPSEC rules and best practices.

        Returns:
            A nested dictionary of rule groups. A value is either a plain
            setting (bool / number) or a list of OPSEC level names.
        """
        return {
            'timing_rules': {
                'max_requests_per_minute': 10,
                'min_delay_between_scans': 1000,  # milliseconds
                'avoid_business_hours': True,
                'spread_over_days': ['high', 'maximum']
            },
            'stealth_rules': {
                'use_decoy_ips': ['high', 'maximum'],
                'fragment_packets': ['medium', 'high', 'maximum'],
                'randomize_source_ports': True,
                'avoid_default_timing': ['medium', 'high', 'maximum']
            },
            'target_rules': {
                'avoid_honeypots': True,
                'check_threat_intelligence': True,
                'respect_robots_txt': True,
                'avoid_government_domains': True
            },
            'operational_rules': {
                'log_all_activities': True,
                'use_vpn_tor': ['high', 'maximum'],
                'rotate_infrastructure': ['high', 'maximum'],
                'monitor_defensive_responses': True
            }
        }

    def _load_risk_patterns(self) -> Dict:
        """Load patterns that indicate high-risk activities.

        Returns:
            A dictionary mapping a category name to a list of regular
            expression strings. The checks apply them with ``re.IGNORECASE``.
        """
        return {
            'high_detection_commands': [
                r'-A\b',  # Aggressive scan
                r'--script.*vuln',  # Vulnerability scripts
                r'-sU.*-sS',  # UDP + SYN scan combination
                r'--top-ports\s+(\d+)',  # High port count
                r'-T[45]',  # Aggressive timing
                r'--min-rate\s+\d{3,}',  # High rate scanning
                r'nikto',  # Web vulnerability scanner
                r'sqlmap',  # SQL injection tool
                r'hydra',  # Brute force tool
                r'john',  # Password cracker
                r'hashcat'  # Password cracker
            ],
            'opsec_violations': [
                r'--reason',  # Custom scan reason (logging risk)
                r'-v{2,}',  # High verbosity
                r'--packet-trace',  # Packet tracing
                r'--traceroute',  # Network path disclosure
                r'-sn.*--traceroute',  # Ping sweep with traceroute
                r'--source-port\s+53',  # DNS source port spoofing
                r'--data-string',  # Custom data (potential signature)
            ],
            'infrastructure_risks': [
                r'shodan.*api',  # Shodan API usage
                r'censys.*search',  # Censys API usage
                r'virustotal',  # VirusTotal queries
                r'threatcrowd',  # Threat intelligence queries
                r'passivetotal'  # PassiveTotal queries
            ],
            'time_sensitive': [
                r'while.*true',  # Infinite loops
                r'for.*in.*range\(\s*\d{3,}',  # Large iterations
                r'sleep\s+[0-9]*[.][0-9]+',  # Very short delays
                r'--max-rate',  # Rate limiting bypass
            ]
        }

    @staticmethod
    def _join_commands(commands: Dict[str, List[str]]) -> str:
        """Flatten every command of every category into one space-joined string."""
        return ' '.join(cmd for cmd_list in commands.values() for cmd in cmd_list)

    def validate_commands(self, commands: Dict[str, List[str]], opsec_level: str = 'medium') -> SafetyAssessment:
        """
        Validate a set of commands for OPSEC compliance and safety.

        Args:
            commands: Dictionary of command categories and command lists
            opsec_level: Required OPSEC level ('low', 'medium', 'high', 'maximum')

        Returns:
            SafetyAssessment with validation results
        """
        self.logger.info("Validating commands for OPSEC level: %s", opsec_level)

        # Perform individual safety checks
        checks = [
            self._check_detection_risk(commands),
            self._check_opsec_compliance(commands, opsec_level),
            self._check_timing_compliance(commands, opsec_level),
            self._check_infrastructure_safety(commands),
            self._check_target_appropriateness(commands),
        ]

        overall_risk = self._calculate_overall_risk(checks)
        approved = self._determine_approval(overall_risk, opsec_level)
        summary = self._generate_summary(checks, overall_risk, approved)

        # Safe alternatives are only offered when the request was not approved.
        safe_alternatives = []
        if not approved:
            safe_alternatives = self._generate_safe_alternatives(commands, opsec_level)

        return SafetyAssessment(
            overall_risk=overall_risk,
            checks=checks,
            approved=approved,
            summary=summary,
            safe_alternatives=safe_alternatives
        )

    def _check_detection_risk(self, commands: Dict[str, List[str]]) -> SafetyCheck:
        """Check for commands with high detection risk.

        Every ``high_detection_commands`` pattern that matches anywhere in the
        joined command text adds one violation. No violations yields LOW, one
        or two MEDIUM, more than two HIGH.
        """
        violations = []
        recommendations = []
        command_text = self._join_commands(commands)

        for pattern in self.risk_patterns['high_detection_commands']:
            if re.search(pattern, command_text, re.IGNORECASE):
                violations.append(f"High-detection pattern found: {pattern}")

        # Check for aggressive scanning combinations
        if '-sS' in command_text and '-sV' in command_text:
            violations.append("Aggressive scanning combination: SYN scan + service detection")

        if not violations:
            risk_level = RiskLevel.LOW
            description = "No high-detection risk patterns found"
        elif len(violations) <= 2:
            risk_level = RiskLevel.MEDIUM
            description = "Some detection risk patterns identified"
            recommendations.extend([
                "Consider using stealth timing (-T1 or -T2)",
                "Add packet fragmentation (-f)",
                "Implement delays between scans"
            ])
        else:
            risk_level = RiskLevel.HIGH
            description = "Multiple high-detection risk patterns found"
            recommendations.extend([
                "Significantly reduce scanning aggressiveness",
                "Use passive techniques where possible",
                "Implement substantial delays",
                "Consider using decoy IPs"
            ])

        return SafetyCheck(
            check_name="Detection Risk Analysis",
            risk_level=risk_level,
            description=description,
            violations=violations,
            recommendations=recommendations
        )

    def _check_opsec_compliance(self, commands: Dict[str, List[str]], opsec_level: str) -> SafetyCheck:
        """Check OPSEC compliance based on required level.

        Args:
            commands: Dictionary of command categories and command lists.
            opsec_level: Required OPSEC level ('low', 'medium', 'high', 'maximum').

        Returns:
            SafetyCheck: LOW with no violations, MEDIUM with one or two,
            HIGH otherwise.
        """
        violations = []
        recommendations = []
        all_commands = self._join_commands(commands)

        # Both -T4 and -T5 are aggressive timing templates; flag whichever is present.
        aggressive_timing = re.search(r'-T[45]\b', all_commands)
        if opsec_level in ['medium', 'high', 'maximum'] and aggressive_timing:
            violations.append(
                f"Aggressive timing ({aggressive_timing.group(0)}) conflicts with stealth requirements"
            )

        # Match the fragmentation option as a standalone token (-f, -ff, --mtu)
        # so that a hostname such as "target-ftp.example.com" does not count.
        uses_fragmentation = re.search(r'(?<!\S)(?:-f+|--mtu)\b', all_commands)
        if opsec_level in ['high', 'maximum'] and not uses_fragmentation:
            violations.append("Packet fragmentation (-f) recommended for high stealth")

        if opsec_level == 'maximum' and 'nmap' in all_commands:
            violations.append("Active scanning not recommended for maximum stealth")

        # Check for OPSEC violation patterns
        for pattern in self.risk_patterns['opsec_violations']:
            if re.search(pattern, all_commands, re.IGNORECASE):
                violations.append(f"OPSEC violation pattern: {pattern}")

        # Determine risk level
        if not violations:
            risk_level = RiskLevel.LOW
            description = f"Commands comply with {opsec_level} OPSEC requirements"
        elif len(violations) <= 2:
            risk_level = RiskLevel.MEDIUM
            description = f"Minor OPSEC compliance issues for {opsec_level} level"
        else:
            risk_level = RiskLevel.HIGH
            description = f"Significant OPSEC violations for {opsec_level} level"

        # Generate recommendations based on OPSEC level
        if opsec_level == 'maximum':
            recommendations.extend([
                "Use only passive reconnaissance techniques",
                "Employ Tor or VPN for all queries",
                "Spread activities over multiple days"
            ])
        elif opsec_level == 'high':
            recommendations.extend([
                "Use stealth timing (-T1 or -T2)",
                "Implement packet fragmentation",
                "Add significant delays between operations"
            ])

        return SafetyCheck(
            check_name="OPSEC Compliance",
            risk_level=risk_level,
            description=description,
            violations=violations,
            recommendations=recommendations
        )

    def _check_timing_compliance(self, commands: Dict[str, List[str]], opsec_level: str) -> SafetyCheck:
        """Check timing and rate limiting compliance.

        Flags aggressive timing templates at 'medium' and above, and at
        'high'/'maximum' also ``--min-rate`` values over 100 and a missing
        ``--scan-delay``.
        """
        violations = []
        recommendations = []
        all_commands = self._join_commands(commands)

        # Check for aggressive timing
        aggressive_timing = re.findall(r'-T([45])', all_commands)
        if aggressive_timing and opsec_level in ['medium', 'high', 'maximum']:
            violations.append(f"Aggressive timing (-T{'/'.join(aggressive_timing)}) violates {opsec_level} OPSEC")

        # Check for high rate scanning
        for rate in re.findall(r'--min-rate\s+(\d+)', all_commands):
            if int(rate) > 100 and opsec_level in ['high', 'maximum']:
                violations.append(f"High scan rate ({rate}) not suitable for {opsec_level} OPSEC")

        # Check for insufficient delays
        delay_matches = re.findall(r'--scan-delay\s+(\d+)', all_commands)
        if opsec_level in ['high', 'maximum'] and not delay_matches:
            violations.append("Scan delays not specified for high stealth requirement")

        if not violations:
            risk_level = RiskLevel.LOW
        elif len(violations) <= 2:
            risk_level = RiskLevel.MEDIUM
        else:
            risk_level = RiskLevel.HIGH

        if risk_level != RiskLevel.LOW:
            recommendations.extend([
                "Implement appropriate scan timing for OPSEC level",
                "Add delays between scan phases",
                "Consider spreading scans over longer time periods"
            ])

        return SafetyCheck(
            check_name="Timing Compliance",
            risk_level=risk_level,
            description=f"Timing analysis for {opsec_level} OPSEC level",
            violations=violations,
            recommendations=recommendations
        )

    def _check_infrastructure_safety(self, commands: Dict[str, List[str]]) -> SafetyCheck:
        """Check for infrastructure and API safety.

        Returns MEDIUM when any ``infrastructure_risks`` pattern matches or
        the command text mentions both "api" and "key"; LOW otherwise.
        """
        violations = []
        recommendations = []
        all_commands = self._join_commands(commands)

        # Check for infrastructure risks
        for pattern in self.risk_patterns['infrastructure_risks']:
            if re.search(pattern, all_commands, re.IGNORECASE):
                violations.append(f"Infrastructure risk: {pattern}")

        # Check for API key exposure
        lowered = all_commands.lower()
        if 'api' in lowered and 'key' in lowered:
            violations.append("Potential API key exposure in commands")

        risk_level = RiskLevel.MEDIUM if violations else RiskLevel.LOW
        if violations:
            recommendations.extend([
                "Secure API keys using environment variables",
                "Use VPN/proxy for external API queries",
                "Monitor API usage quotas"
            ])

        return SafetyCheck(
            check_name="Infrastructure Safety",
            risk_level=risk_level,
            description="Infrastructure and API safety analysis",
            violations=violations,
            recommendations=recommendations
        )

    def _check_target_appropriateness(self, commands: Dict[str, List[str]]) -> SafetyCheck:
        """Check target appropriateness and legal considerations.

        A target with a ``gov``, ``mil`` or ``fed`` DNS label after its first
        label is reported as a government domain; ``gov``/``mil`` make the
        check CRITICAL. Any other violation (``fed`` label, honeypot keyword)
        makes it HIGH.
        """
        violations = []
        recommendations = []
        critical = False

        for target in self._extract_targets_from_commands(commands):
            lowered = target.lower()

            # Compare whole DNS labels so that e.g. "www.government-news.com"
            # is not mistaken for a ".gov" domain, while "example.gov.uk" is caught.
            restricted_labels = {'gov', 'mil', 'fed'}.intersection(lowered.split('.')[1:])
            if restricted_labels:
                violations.append(f"Government domain detected: {target}")
                if restricted_labels & {'gov', 'mil'}:
                    critical = True

            # Check for known honeypot indicators
            if any(honeypot in lowered for honeypot in ['honeypot', 'canary', 'trap']):
                violations.append(f"Potential honeypot detected: {target}")

        if critical:
            risk_level = RiskLevel.CRITICAL
        elif violations:
            risk_level = RiskLevel.HIGH
        else:
            risk_level = RiskLevel.LOW

        if risk_level != RiskLevel.LOW:
            recommendations.extend([
                "Verify authorization for all targets",
                "Review legal implications",
                "Consider using test environments"
            ])

        return SafetyCheck(
            check_name="Target Appropriateness",
            risk_level=risk_level,
            description="Target selection and legal compliance",
            violations=violations,
            recommendations=recommendations
        )

    def _extract_targets_from_commands(self, commands: Dict[str, List[str]]) -> List[str]:
        """Extract target IPs/domains from commands.

        Returns:
            Unique dotted-quad IPs and dotted host names in first-seen order.
            Bare words such as tool names or option letters are not returned.
            NOTE(review): dotted file names (e.g. "scan.txt") still look like
            host names to this heuristic.
        """
        ip_pattern = r'\b(?:\d{1,3}\.){3}\d{1,3}\b'
        # At least one "label." followed by an alphabetic TLD, so single
        # tokens and purely numeric strings do not match.
        domain_pattern = r'\b(?:[a-zA-Z0-9](?:[a-zA-Z0-9-]{0,61}[a-zA-Z0-9])?\.)+[a-zA-Z]{2,63}\b'

        targets = []
        for cmd_list in commands.values():
            for cmd in cmd_list:
                targets.extend(re.findall(ip_pattern, cmd))
                targets.extend(re.findall(domain_pattern, cmd))

        # dict.fromkeys removes duplicates while keeping a deterministic order.
        return list(dict.fromkeys(targets))

    def _calculate_overall_risk(self, checks: List[SafetyCheck]) -> RiskLevel:
        """Calculate overall risk level from individual checks.

        Any CRITICAL check makes the result CRITICAL. Otherwise the mean of
        the numeric scores decides: >= 3.0 is HIGH, >= 2.0 is MEDIUM, else LOW.
        An empty ``checks`` list yields LOW.

        NOTE(review): because of the averaging, a single HIGH check among
        several LOW ones still yields LOW overall — confirm this is intended.
        """
        risk_scores = {
            RiskLevel.LOW: 1,
            RiskLevel.MEDIUM: 2,
            RiskLevel.HIGH: 3,
            RiskLevel.CRITICAL: 4
        }
        if not checks:
            return RiskLevel.LOW

        # Enum members are not orderable, so compare their numeric scores.
        scores = [risk_scores[check.risk_level] for check in checks]

        # If any check is critical, overall is critical
        if max(scores) == risk_scores[RiskLevel.CRITICAL]:
            return RiskLevel.CRITICAL

        avg_risk = sum(scores) / len(scores)
        if avg_risk >= 3.0:
            return RiskLevel.HIGH
        if avg_risk >= 2.0:
            return RiskLevel.MEDIUM
        return RiskLevel.LOW

    def _determine_approval(self, overall_risk: RiskLevel, opsec_level: str) -> bool:
        """Determine if commands are approved based on risk and configuration.

        Args:
            overall_risk: Aggregated risk level.
            opsec_level: Accepted for interface symmetry; not consulted here.

        Returns:
            True when the commands are approved, False when they are rejected
            or need manual approval.
        """
        if overall_risk == RiskLevel.CRITICAL:
            return False
        if overall_risk == RiskLevel.HIGH and self.config['strict_mode']:
            return False
        if overall_risk.value in self.config['require_human_approval']:
            self.logger.warning("HUMAN APPROVAL REQUIRED for %s risk level", overall_risk.value)
            return False  # Requires manual approval
        # NOTE(review): LOW is approved by the final return regardless of
        # 'auto_approve_low_risk', so this branch does not change the outcome.
        if overall_risk == RiskLevel.LOW and self.config['auto_approve_low_risk']:
            return True
        return overall_risk in [RiskLevel.LOW, RiskLevel.MEDIUM]

    def _generate_summary(self, checks: List[SafetyCheck], overall_risk: RiskLevel, approved: bool) -> str:
        """Generate a summary of the safety assessment.

        Returns:
            Newline-terminated lines with status, overall risk and violation
            count, followed — when rejected — by one line per check that
            reported violations.
        """
        violation_count = sum(len(check.violations) for check in checks)
        status = "APPROVED" if approved else "REJECTED"

        parts = [
            f"Safety Assessment: {status}\n",
            f"Overall Risk Level: {overall_risk.value.upper()}\n",
            f"Total Violations: {violation_count}\n",
        ]
        if not approved:
            parts.append("\nREASONS FOR REJECTION:\n")
            parts.extend(
                f"- {check.check_name}: {len(check.violations)} violations\n"
                for check in checks
                if check.violations
            )
        return ''.join(parts)

    def _generate_safe_alternatives(self, commands: Dict[str, List[str]], opsec_level: str) -> List[str]:
        """Generate safer alternative commands.

        Returns:
            A fixed list of general suggestions, extended with stricter ones
            for the 'high' and 'maximum' OPSEC levels. ``commands`` is not
            inspected.
        """
        alternatives = [
            "Use passive reconnaissance techniques first",
            "Implement longer delays between scans (--scan-delay 2000ms)",
            "Use stealth timing (-T1 or -T2)",
            "Add packet fragmentation (-f)",
            "Reduce port scan range (--top-ports 100)",
            "Use decoy IPs (-D RND:10)"
        ]
        if opsec_level in ['high', 'maximum']:
            alternatives.extend([
                "Consider using only passive techniques",
                "Employ Tor/VPN for all reconnaissance",
                "Spread activities over multiple days",
                "Use different source IPs for different phases"
            ])
        return alternatives
# Example usage and testing
if __name__ == "__main__":
    # Configure logging so the agent's INFO/WARNING messages are visible.
    logging.basicConfig(level=logging.INFO)

    # Initialize safety agent with the built-in default configuration.
    agent = SafetyAgent()

    # Example commands to validate: two active nmap scans plus passive lookups.
    test_commands = {
        'nmap': [
            'nmap -sS -T4 --top-ports 1000 example.com',
            'nmap -A -v example.com'
        ],
        'passive': [
            'dig example.com ANY',
            'whois example.com'
        ]
    }

    # Validate commands against the 'high' OPSEC level and print the outcome.
    assessment = agent.validate_commands(test_commands, opsec_level='high')
    print(f"Assessment: {assessment.approved}")
    print(f"Overall Risk: {assessment.overall_risk.value}")
    print(f"Summary:\n{assessment.summary}")

    if assessment.safe_alternatives:
        print("\nSafe Alternatives:")
        for alt in assessment.safe_alternatives:
            print(f"- {alt}")