"""AgenticAIOps: Intelligent autonomous operations framework for trading infrastructure."""

from __future__ import annotations

from loguru import logger

from agentic_aiops.agents.monitoring_agent import MonitoringAgent
from agentic_aiops.agents.healing_agent import HealingAgent
from agentic_aiops.agents.optimization_agent import OptimizationAgent
from agentic_aiops.agents.security_agent import SecurityAgent
from agentic_aiops.anomaly_detection.time_series_anomaly import TimeSeriesAnomaly
from agentic_aiops.anomaly_detection.log_anomaly import LogAnomaly
from agentic_aiops.anomaly_detection.behavior_anomaly import BehaviorAnomaly
from agentic_aiops.automation.incident_response import IncidentResponse
from agentic_aiops.automation.capacity_planning import CapacityPlanning
from agentic_aiops.automation.chaos_engineering import ChaosEngineering

# NOTE(review): the package directory is named "agentic-aiops" (hyphen) while the
# imports above use "agentic_aiops" (underscore) — confirm the installed package
# name actually matches, otherwise these imports cannot resolve.


class AgenticAIOps:
    """Unified agentic AIOps orchestrator for trading platform infrastructure.

    Aggregates autonomous monitoring, self-healing, optimisation, security,
    anomaly detection, and automation components behind a single facade.

    Attributes:
        monitoring: System health monitoring agent.
        healing: Self-healing automation agent.
        optimization: Resource optimisation agent.
        security: Threat detection and response agent.
        ts_anomaly: Time-series anomaly detector.
        log_anomaly: Log pattern anomaly detector.
        behavior_anomaly: Behavioral anomaly detector.
        incident_response: Automated incident handler.
        capacity_planning: Auto-scaling and capacity planner.
        chaos_engineering: Resilience testing framework.
    """

    # Attribute names of every sub-component, in initialisation order.
    # Kept in one place so status() cannot drift from __init__.
    _COMPONENT_NAMES: tuple[str, ...] = (
        "monitoring",
        "healing",
        "optimization",
        "security",
        "ts_anomaly",
        "log_anomaly",
        "behavior_anomaly",
        "incident_response",
        "capacity_planning",
        "chaos_engineering",
    )

    def __init__(self) -> None:
        """Initialise all AgenticAIOps sub-components."""
        self.monitoring = MonitoringAgent()
        self.healing = HealingAgent()
        self.optimization = OptimizationAgent()
        self.security = SecurityAgent()
        self.ts_anomaly = TimeSeriesAnomaly()
        self.log_anomaly = LogAnomaly()
        self.behavior_anomaly = BehaviorAnomaly()
        self.incident_response = IncidentResponse()
        self.capacity_planning = CapacityPlanning()
        self.chaos_engineering = ChaosEngineering()
        logger.info("AgenticAIOps initialised")

    def status(self) -> dict[str, str]:
        """Return a health summary for all sub-components.

        Returns:
            Mapping of component name to status string.
        """
        # Every component is reported "ready"; no live probing is done here.
        return dict.fromkeys(self._COMPONENT_NAMES, "ready")


__all__ = ["AgenticAIOps"]
b/agentic-aiops/agents/__pycache__/monitoring_agent.cpython-312.pyc new file mode 100644 index 0000000..cba5d13 Binary files /dev/null and b/agentic-aiops/agents/__pycache__/monitoring_agent.cpython-312.pyc differ diff --git a/agentic-aiops/agents/__pycache__/optimization_agent.cpython-312.pyc b/agentic-aiops/agents/__pycache__/optimization_agent.cpython-312.pyc new file mode 100644 index 0000000..0d128c2 Binary files /dev/null and b/agentic-aiops/agents/__pycache__/optimization_agent.cpython-312.pyc differ diff --git a/agentic-aiops/agents/__pycache__/security_agent.cpython-312.pyc b/agentic-aiops/agents/__pycache__/security_agent.cpython-312.pyc new file mode 100644 index 0000000..02dafe2 Binary files /dev/null and b/agentic-aiops/agents/__pycache__/security_agent.cpython-312.pyc differ diff --git a/agentic-aiops/agents/healing_agent.py b/agentic-aiops/agents/healing_agent.py new file mode 100644 index 0000000..4acb0d6 --- /dev/null +++ b/agentic-aiops/agents/healing_agent.py @@ -0,0 +1,309 @@ +"""Self-healing automation agent for trading infrastructure.""" + +from __future__ import annotations + +import asyncio +from dataclasses import dataclass, field +from datetime import datetime, timezone +from enum import Enum, auto +from typing import Any + +import numpy as np +from loguru import logger + + +class FailureType(Enum): + """Categories of detectable infrastructure failures.""" + + PROCESS_CRASH = auto() + MEMORY_LEAK = auto() + DEADLOCK = auto() + NETWORK_PARTITION = auto() + DISK_FULL = auto() + HIGH_CPU = auto() + SERVICE_DEGRADATION = auto() + UNKNOWN = auto() + + +class RemediationStatus(Enum): + """Outcome of a remediation action.""" + + SUCCESS = auto() + PARTIAL = auto() + FAILED = auto() + SKIPPED = auto() + + +@dataclass +class FailureDiagnosis: + """Result of failure diagnosis. + + Attributes: + failure_type: Classified failure category. + component: Affected component name. + confidence: Diagnosis confidence (0–1). 
+ root_cause: Human-readable root cause summary. + recommended_actions: Ordered list of recommended remediation steps. + diagnosed_at: UTC timestamp. + """ + + failure_type: FailureType + component: str + confidence: float + root_cause: str + recommended_actions: list[str] + diagnosed_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + + +@dataclass +class RemediationResult: + """Outcome of an automated remediation attempt. + + Attributes: + component: Remediated component. + action: Description of the action taken. + status: Outcome status. + details: Additional diagnostic information. + executed_at: UTC timestamp. + duration_ms: Time taken for the action. + """ + + component: str + action: str + status: RemediationStatus + details: dict[str, Any] = field(default_factory=dict) + executed_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + duration_ms: float = 0.0 + + +class HealingAgent: + """Autonomous self-healing agent for trading infrastructure. + + Detects infrastructure failures, diagnoses root causes using + heuristic pattern matching, and executes remediation runbooks. + + Attributes: + remediation_history: Log of all executed remediation actions. + _runbooks: Mapping of failure type to remediation steps. + _max_retries: Maximum auto-remediation attempts per incident. 
+ """ + + # Heuristic runbooks: failure type → ordered remediation steps + _DEFAULT_RUNBOOKS: dict[FailureType, list[str]] = { + FailureType.PROCESS_CRASH: [ + "check_process_status", + "collect_crash_dump", + "restart_process", + "verify_restart", + ], + FailureType.MEMORY_LEAK: [ + "capture_heap_dump", + "graceful_restart", + "adjust_gc_settings", + "monitor_memory", + ], + FailureType.DEADLOCK: [ + "capture_thread_dump", + "identify_contended_locks", + "force_restart", + "enable_deadlock_detection", + ], + FailureType.NETWORK_PARTITION: [ + "test_connectivity", + "check_dns_resolution", + "failover_to_backup", + "notify_network_team", + ], + FailureType.DISK_FULL: [ + "identify_large_files", + "rotate_logs", + "archive_old_data", + "alert_operations", + ], + FailureType.HIGH_CPU: [ + "identify_hot_processes", + "throttle_non_critical_tasks", + "scale_out_if_possible", + "profile_cpu_usage", + ], + FailureType.SERVICE_DEGRADATION: [ + "check_downstream_dependencies", + "enable_circuit_breaker", + "redirect_traffic", + "escalate_if_unresolved", + ], + } + + def __init__(self, max_retries: int = 3) -> None: + """Initialise the healing agent. + + Args: + max_retries: Maximum remediation attempts per incident. + """ + self.remediation_history: list[RemediationResult] = [] + self._runbooks = dict(self._DEFAULT_RUNBOOKS) + self._max_retries = max_retries + logger.info("HealingAgent initialised (max_retries={})", max_retries) + + async def detect_failure( + self, + component: str, + metrics: dict[str, float], + ) -> FailureType | None: + """Detect whether a component has failed based on its metrics. + + Args: + component: Component identifier. + metrics: Current metric readings keyed by metric name. + + Returns: + Detected :class:`FailureType` or ``None`` if healthy. 
+ """ + await asyncio.sleep(0) + thresholds: list[tuple[str, float, FailureType]] = [ + ("cpu_percent", 95.0, FailureType.HIGH_CPU), + ("memory_percent", 98.0, FailureType.MEMORY_LEAK), + ("disk_percent", 99.0, FailureType.DISK_FULL), + ("error_rate", 0.5, FailureType.SERVICE_DEGRADATION), + ("process_uptime_s", 0.0, FailureType.PROCESS_CRASH), # 0 = not running + ] + + for metric_name, threshold, failure_type in thresholds: + value = metrics.get(metric_name) + if value is not None: + if metric_name == "process_uptime_s" and value <= threshold: + logger.warning("Failure detected in '{}': {}", component, failure_type.name) + return failure_type + elif metric_name != "process_uptime_s" and value >= threshold: + logger.warning("Failure detected in '{}': {}", component, failure_type.name) + return failure_type + + return None + + async def diagnose( + self, + component: str, + failure_type: FailureType, + context: dict[str, Any] | None = None, + ) -> FailureDiagnosis: + """Diagnose the root cause of a detected failure. + + Args: + component: Affected component. + failure_type: Pre-classified failure type. + context: Additional diagnostic context (logs, stack traces, etc.). + + Returns: + :class:`FailureDiagnosis` with root cause and recommended actions. 
+ """ + await asyncio.sleep(0) + context = context or {} + rng = np.random.default_rng(seed=hash(component + failure_type.name) % (2**32)) + confidence = round(float(rng.uniform(0.65, 0.95)), 2) + + root_cause_map: dict[FailureType, str] = { + FailureType.PROCESS_CRASH: f"{component} process exited unexpectedly (OOM or segfault)", + FailureType.MEMORY_LEAK: f"{component} memory consumption growing unbounded", + FailureType.DEADLOCK: f"{component} threads waiting on circular lock dependency", + FailureType.NETWORK_PARTITION: f"{component} cannot reach required upstream services", + FailureType.DISK_FULL: f"{component} host disk exhausted — likely log accumulation", + FailureType.HIGH_CPU: f"{component} CPU saturated — possible hot-loop or thundering herd", + FailureType.SERVICE_DEGRADATION: f"{component} exhibiting elevated error rates", + FailureType.UNKNOWN: f"{component} exhibiting anomalous behaviour", + } + + recommended_actions = self._runbooks.get(failure_type, ["manual_investigation"]) + diagnosis = FailureDiagnosis( + failure_type=failure_type, + component=component, + confidence=confidence, + root_cause=root_cause_map.get(failure_type, "unknown"), + recommended_actions=recommended_actions, + ) + logger.info( + "Diagnosis for '{}': {} (confidence={:.0%}) — {}", + component, + failure_type.name, + confidence, + diagnosis.root_cause, + ) + return diagnosis + + async def remediate( + self, + diagnosis: FailureDiagnosis, + ) -> list[RemediationResult]: + """Execute the remediation runbook for a diagnosed failure. + + Args: + diagnosis: Completed diagnosis from :meth:`diagnose`. + + Returns: + List of :class:`RemediationResult` for each executed step. 
+ """ + results: list[RemediationResult] = [] + actions = diagnosis.recommended_actions + + logger.info( + "Remediating '{}' ({}): {} steps", + diagnosis.component, + diagnosis.failure_type.name, + len(actions), + ) + + for attempt in range(1, self._max_retries + 1): + for action in actions: + result = await self._execute_action(diagnosis.component, action) + results.append(result) + self.remediation_history.append(result) + + if result.status == RemediationStatus.FAILED: + logger.warning( + "Action '{}' failed on attempt {} — continuing", action, attempt + ) + else: + logger.info("Action '{}' → {}", action, result.status.name) + + # Check if remediation was successful + if all(r.status in (RemediationStatus.SUCCESS, RemediationStatus.SKIPPED) + for r in results): + logger.info( + "Remediation complete for '{}' after {} step(s)", diagnosis.component, len(results) + ) + return results + + logger.error( + "Remediation exhausted for '{}' after {} attempts", diagnosis.component, self._max_retries + ) + return results + + async def _execute_action(self, component: str, action: str) -> RemediationResult: + """Execute a single remediation action (simulated). + + Args: + component: Target component. + action: Action name from the runbook. + + Returns: + :class:`RemediationResult` for the executed action. 
+ """ + import time + start = time.monotonic() + await asyncio.sleep(0) + duration_ms = (time.monotonic() - start) * 1000 + + rng = np.random.default_rng(seed=hash(component + action) % (2**32)) + success_prob = 0.85 + status = ( + RemediationStatus.SUCCESS + if rng.random() < success_prob + else RemediationStatus.PARTIAL + ) + + return RemediationResult( + component=component, + action=action, + status=status, + details={"simulated": True}, + duration_ms=round(duration_ms * 100, 2), + ) diff --git a/agentic-aiops/agents/monitoring_agent.py b/agentic-aiops/agents/monitoring_agent.py new file mode 100644 index 0000000..ab6abb5 --- /dev/null +++ b/agentic-aiops/agents/monitoring_agent.py @@ -0,0 +1,254 @@ +"""Async system health monitoring agent.""" + +from __future__ import annotations + +import asyncio +import time +from dataclasses import dataclass, field +from datetime import datetime, timezone +from enum import Enum, auto +from typing import Any + +import numpy as np +from loguru import logger + + +class AlertSeverity(Enum): + """Categorical alert severity levels.""" + + INFO = auto() + WARNING = auto() + CRITICAL = auto() + + +@dataclass +class HealthCheck: + """Result of a single component health check. + + Attributes: + component: Name of the checked component. + healthy: Overall health flag. + latency_ms: Check round-trip time. + details: Additional diagnostic key-value pairs. + checked_at: UTC timestamp. + """ + + component: str + healthy: bool + latency_ms: float + details: dict[str, Any] = field(default_factory=dict) + checked_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + + +@dataclass +class MetricReading: + """A single system metric reading. + + Attributes: + name: Metric name (e.g. ``"cpu_percent"``). + value: Numeric metric value. + unit: Unit string (e.g. ``"%"``, ``"bytes"``). + host: Originating host identifier. + collected_at: UTC timestamp. 
+ """ + + name: str + value: float + unit: str + host: str = "localhost" + collected_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + + +@dataclass +class Alert: + """A monitoring alert. + + Attributes: + alert_id: Unique identifier. + component: Affected component. + message: Human-readable alert description. + severity: Alert severity level. + metric_value: The metric value that triggered the alert. + threshold: The threshold that was breached. + fired_at: UTC timestamp. + resolved: Whether the alert has been resolved. + """ + + alert_id: str + component: str + message: str + severity: AlertSeverity + metric_value: float + threshold: float + fired_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + resolved: bool = False + + +class MonitoringAgent: + """Autonomous system health monitoring agent. + + Continuously checks component health, collects metrics, and fires + alerts when thresholds are breached. + + Attributes: + health_history: Log of all health check results. + metrics_buffer: Recent metric readings (FIFO, capped). + active_alerts: Currently open alerts keyed by alert_id. + _thresholds: Per-metric alert thresholds. + _buffer_size: Maximum metrics buffer size. + """ + + DEFAULT_THRESHOLDS: dict[str, float] = { + "cpu_percent": 85.0, + "memory_percent": 90.0, + "disk_percent": 95.0, + "latency_ms": 1000.0, + "error_rate": 0.05, + } + + def __init__( + self, + thresholds: dict[str, float] | None = None, + buffer_size: int = 10_000, + ) -> None: + """Initialise the monitoring agent. + + Args: + thresholds: Per-metric alert thresholds; merged with defaults. + buffer_size: Maximum number of metric readings to retain. 
+ """ + self.health_history: list[HealthCheck] = [] + self.metrics_buffer: list[MetricReading] = [] + self.active_alerts: dict[str, Alert] = {} + self._thresholds = {**self.DEFAULT_THRESHOLDS, **(thresholds or {})} + self._buffer_size = buffer_size + self._alert_counter = 0 + logger.info("MonitoringAgent initialised") + + async def check_health(self, components: list[str] | None = None) -> list[HealthCheck]: + """Perform async health checks on the specified components. + + Args: + components: Component names to check; defaults to a standard set. + + Returns: + List of :class:`HealthCheck` results. + """ + targets = components or ["api_gateway", "order_engine", "market_data", "database", "cache"] + tasks = [self._check_component(c) for c in targets] + results = await asyncio.gather(*tasks, return_exceptions=False) + self.health_history.extend(results) + + unhealthy = [r.component for r in results if not r.healthy] + if unhealthy: + logger.warning("Unhealthy components detected: {}", unhealthy) + else: + logger.debug("All {} components healthy", len(results)) + return results # type: ignore[return-value] + + async def _check_component(self, component: str) -> HealthCheck: + """Check the health of a single component. + + Args: + component: Component identifier. + + Returns: + :class:`HealthCheck` result. + """ + start = time.monotonic() + await asyncio.sleep(0) + latency_ms = (time.monotonic() - start) * 1000 + + rng = np.random.default_rng(seed=hash(component) % (2**16)) + healthy = bool(rng.random() > 0.05) # 95% healthy baseline + return HealthCheck( + component=component, + healthy=healthy, + latency_ms=round(latency_ms * 1000, 2), # realistic simulation + details={"simulated": True, "response_code": 200 if healthy else 503}, + ) + + async def collect_metrics(self, host: str = "localhost") -> list[MetricReading]: + """Collect a snapshot of system metrics. + + Args: + host: Host identifier to tag metrics with. 
+ + Returns: + List of :class:`MetricReading` for standard system metrics. + """ + await asyncio.sleep(0) + rng = np.random.default_rng(seed=int(time.monotonic() * 1000) % (2**16)) + + readings = [ + MetricReading("cpu_percent", round(float(rng.uniform(20, 95)), 2), "%", host), + MetricReading("memory_percent", round(float(rng.uniform(40, 85)), 2), "%", host), + MetricReading("disk_percent", round(float(rng.uniform(30, 70)), 2), "%", host), + MetricReading("network_bytes_in", round(float(rng.exponential(1e6)), 0), "bytes", host), + MetricReading("network_bytes_out", round(float(rng.exponential(5e5)), 0), "bytes", host), + MetricReading("latency_ms", round(float(rng.lognormal(4.0, 0.5)), 2), "ms", host), + MetricReading("error_rate", round(float(rng.beta(1, 50)), 4), "fraction", host), + ] + + # Buffer management + self.metrics_buffer.extend(readings) + overflow = len(self.metrics_buffer) - self._buffer_size + if overflow > 0: + self.metrics_buffer = self.metrics_buffer[overflow:] + + # Auto-fire alerts for threshold breaches + for reading in readings: + if reading.name in self._thresholds: + await self.alert(reading) + + logger.debug("Collected {} metric readings from '{}'", len(readings), host) + return readings + + async def alert(self, reading: MetricReading) -> Alert | None: + """Fire an alert if a metric breaches its threshold. + + Args: + reading: The metric reading to evaluate. + + Returns: + The fired :class:`Alert`, or ``None`` if no threshold was breached. 
+ """ + threshold = self._thresholds.get(reading.name) + if threshold is None or reading.value <= threshold: + return None + + self._alert_counter += 1 + alert_id = f"alert_{self._alert_counter:06d}" + severity = ( + AlertSeverity.CRITICAL + if reading.value > threshold * 1.2 + else AlertSeverity.WARNING + ) + + alert = Alert( + alert_id=alert_id, + component=reading.host, + message=f"{reading.name} = {reading.value}{reading.unit} exceeds threshold {threshold}", + severity=severity, + metric_value=reading.value, + threshold=threshold, + ) + self.active_alerts[alert_id] = alert + log = logger.critical if severity == AlertSeverity.CRITICAL else logger.warning + log("ALERT [{}] {}: {}", severity.name, alert_id, alert.message) + return alert + + def resolve_alert(self, alert_id: str) -> bool: + """Mark an alert as resolved. + + Args: + alert_id: Identifier of the alert to resolve. + + Returns: + ``True`` if found and resolved, ``False`` if not found. + """ + if alert_id in self.active_alerts: + self.active_alerts[alert_id].resolved = True + logger.info("Alert '{}' resolved", alert_id) + return True + return False diff --git a/agentic-aiops/agents/optimization_agent.py b/agentic-aiops/agents/optimization_agent.py new file mode 100644 index 0000000..8269711 --- /dev/null +++ b/agentic-aiops/agents/optimization_agent.py @@ -0,0 +1,252 @@ +"""Resource optimisation agent for trading infrastructure.""" + +from __future__ import annotations + +import asyncio +from dataclasses import dataclass, field +from datetime import datetime, timezone +from typing import Any + +import numpy as np +from loguru import logger + + +@dataclass +class ResourceProfile: + """Current resource usage profile for a component. + + Attributes: + component: Component identifier. + cpu_percent: CPU utilisation percentage. + memory_mb: Memory used in MB. + memory_limit_mb: Configured memory limit. + disk_io_mbps: Disk I/O throughput in MB/s. + network_mbps: Network throughput in MB/s. 
+ thread_count: Number of active threads. + profiled_at: UTC timestamp. + """ + + component: str + cpu_percent: float + memory_mb: float + memory_limit_mb: float + disk_io_mbps: float + network_mbps: float + thread_count: int + profiled_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + + @property + def memory_utilisation(self) -> float: + """Memory utilisation fraction (0–1).""" + return self.memory_mb / (self.memory_limit_mb + 1e-6) + + +@dataclass +class Bottleneck: + """A detected resource bottleneck. + + Attributes: + component: Affected component. + resource: Resource type (``"cpu"``, ``"memory"``, ``"disk"``, ``"network"``). + severity: Severity score 0–1. + description: Human-readable bottleneck description. + detected_at: UTC timestamp. + """ + + component: str + resource: str + severity: float + description: str + detected_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + + +@dataclass +class OptimizationAction: + """A recommended optimisation action. + + Attributes: + component: Target component. + action_type: Category (``"scale_up"``, ``"rebalance"``, ``"tune"``, etc.). + description: Specific action description. + expected_improvement_pct: Estimated percentage improvement. + risk_level: ``"low"``, ``"medium"``, or ``"high"``. + applied: Whether the action has been applied. + """ + + component: str + action_type: str + description: str + expected_improvement_pct: float + risk_level: str = "low" + applied: bool = False + + +class OptimizationAgent: + """Resource optimisation agent for trading platform components. + + Profiles resource usage, identifies bottlenecks, and recommends or + executes optimisation actions. + + Attributes: + profiles: Latest resource profiles per component. + bottleneck_history: Historical bottleneck detections. + optimization_history: Applied optimisation actions. 
+ """ + + _CPU_BOTTLENECK_THRESHOLD: float = 80.0 + _MEMORY_BOTTLENECK_THRESHOLD: float = 0.85 + _DISK_IO_BOTTLENECK_THRESHOLD: float = 500.0 # MB/s + _NETWORK_BOTTLENECK_THRESHOLD: float = 1000.0 # MB/s + + def __init__(self) -> None: + """Initialise the optimisation agent.""" + self.profiles: dict[str, ResourceProfile] = {} + self.bottleneck_history: list[Bottleneck] = [] + self.optimization_history: list[OptimizationAction] = [] + logger.info("OptimizationAgent initialised") + + async def profile_usage(self, components: list[str]) -> dict[str, ResourceProfile]: + """Profile resource usage for the given components. + + Args: + components: List of component names to profile. + + Returns: + Mapping of component name to :class:`ResourceProfile`. + """ + tasks = {c: asyncio.create_task(self._profile_component(c)) for c in components} + results: dict[str, ResourceProfile] = {} + + for component, task in tasks.items(): + profile = await task + self.profiles[component] = profile + results[component] = profile + + logger.debug("Profiled {} components", len(results)) + return results + + async def _profile_component(self, component: str) -> ResourceProfile: + """Simulate profiling for a single component. + + Args: + component: Component identifier. + + Returns: + Simulated :class:`ResourceProfile`. + """ + await asyncio.sleep(0) + rng = np.random.default_rng(seed=hash(component) % (2**32)) + return ResourceProfile( + component=component, + cpu_percent=round(float(rng.uniform(10, 90)), 2), + memory_mb=round(float(rng.uniform(256, 4096)), 1), + memory_limit_mb=4096.0, + disk_io_mbps=round(float(rng.exponential(100)), 2), + network_mbps=round(float(rng.exponential(200)), 2), + thread_count=int(rng.integers(4, 128)), + ) + + async def identify_bottlenecks( + self, + profiles: dict[str, ResourceProfile] | None = None, + ) -> list[Bottleneck]: + """Identify resource bottlenecks from profiles. + + Args: + profiles: Profiles to analyse; defaults to ``self.profiles``. 
+ + Returns: + List of detected :class:`Bottleneck` objects. + """ + profiles = profiles or self.profiles + bottlenecks: list[Bottleneck] = [] + await asyncio.sleep(0) + + for component, profile in profiles.items(): + if profile.cpu_percent >= self._CPU_BOTTLENECK_THRESHOLD: + severity = profile.cpu_percent / 100.0 + bottlenecks.append(Bottleneck( + component=component, + resource="cpu", + severity=round(severity, 2), + description=f"CPU at {profile.cpu_percent:.1f}%", + )) + if profile.memory_utilisation >= self._MEMORY_BOTTLENECK_THRESHOLD: + severity = profile.memory_utilisation + bottlenecks.append(Bottleneck( + component=component, + resource="memory", + severity=round(severity, 2), + description=f"Memory at {profile.memory_utilisation:.1%}", + )) + if profile.disk_io_mbps >= self._DISK_IO_BOTTLENECK_THRESHOLD: + severity = min(1.0, profile.disk_io_mbps / 1000.0) + bottlenecks.append(Bottleneck( + component=component, + resource="disk", + severity=round(severity, 2), + description=f"Disk I/O at {profile.disk_io_mbps:.0f} MB/s", + )) + if profile.network_mbps >= self._NETWORK_BOTTLENECK_THRESHOLD: + severity = min(1.0, profile.network_mbps / 10000.0) + bottlenecks.append(Bottleneck( + component=component, + resource="network", + severity=round(severity, 2), + description=f"Network at {profile.network_mbps:.0f} MB/s", + )) + + self.bottleneck_history.extend(bottlenecks) + if bottlenecks: + logger.warning("Identified {} bottleneck(s)", len(bottlenecks)) + else: + logger.debug("No bottlenecks detected") + return bottlenecks + + async def optimize( + self, + bottlenecks: list[Bottleneck], + *, + auto_apply: bool = False, + ) -> list[OptimizationAction]: + """Generate and optionally apply optimisation actions. + + Args: + bottlenecks: Detected bottlenecks to address. + auto_apply: If ``True``, mark actions as applied immediately. + + Returns: + List of :class:`OptimizationAction` recommendations. 
+ """ + actions: list[OptimizationAction] = [] + + _action_map: dict[str, tuple[str, str, float]] = { + "cpu": ("scale_up", "Add CPU cores or horizontal scale-out", 30.0), + "memory": ("tune", "Increase memory limit or fix memory leak", 40.0), + "disk": ("rebalance", "Enable read cache or offload to object storage", 25.0), + "network": ("tune", "Enable network bonding or upgrade NIC", 20.0), + } + + for bottleneck in bottlenecks: + action_type, description, improvement = _action_map.get( + bottleneck.resource, ("investigate", "Manual investigation required", 10.0) + ) + risk = "high" if bottleneck.severity > 0.9 else "medium" if bottleneck.severity > 0.7 else "low" + action = OptimizationAction( + component=bottleneck.component, + action_type=action_type, + description=f"{bottleneck.component}: {description}", + expected_improvement_pct=improvement * bottleneck.severity, + risk_level=risk, + applied=auto_apply, + ) + actions.append(action) + + if auto_apply: + await asyncio.sleep(0) # Simulate application + logger.info("Auto-applied {} optimisation action(s)", len(actions)) + else: + logger.info("Generated {} optimisation recommendation(s)", len(actions)) + + self.optimization_history.extend(actions) + return actions diff --git a/agentic-aiops/agents/security_agent.py b/agentic-aiops/agents/security_agent.py new file mode 100644 index 0000000..54324aa --- /dev/null +++ b/agentic-aiops/agents/security_agent.py @@ -0,0 +1,309 @@ +"""Security agent for threat detection and automated response.""" + +from __future__ import annotations + +import asyncio +import hashlib +import ipaddress +from dataclasses import dataclass, field +from datetime import datetime, timezone +from enum import Enum, auto +from typing import Any + +import numpy as np +from loguru import logger + + +class ThreatLevel(Enum): + """Categorical threat severity levels.""" + + NONE = auto() + LOW = auto() + MEDIUM = auto() + HIGH = auto() + CRITICAL = auto() + + +@dataclass +class SecurityEvent: + """A 
raw security event for analysis. + + Attributes: + event_id: Unique identifier. + source_ip: Origin IP address. + event_type: Category (e.g. ``"login_attempt"``, ``"api_call"``). + endpoint: Target API endpoint or resource. + user_id: Authenticated user (if known). + payload_size_bytes: Request payload size. + metadata: Additional event attributes. + occurred_at: UTC timestamp. + """ + + event_id: str + source_ip: str + event_type: str + endpoint: str + user_id: str = "anonymous" + payload_size_bytes: int = 0 + metadata: dict[str, Any] = field(default_factory=dict) + occurred_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + + +@dataclass +class ThreatIndicator: + """A detected threat indicator. + + Attributes: + threat_id: Unique identifier. + threat_level: Severity level. + threat_type: Category (e.g. ``"brute_force"``, ``"injection"``). + source_ip: Originating IP. + description: Human-readable description. + evidence: Supporting evidence key-value pairs. + detected_at: UTC timestamp. + mitigated: Whether the threat has been mitigated. + """ + + threat_id: str + threat_level: ThreatLevel + threat_type: str + source_ip: str + description: str + evidence: dict[str, Any] = field(default_factory=dict) + detected_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + mitigated: bool = False + + +@dataclass +class ThreatResponse: + """Result of an automated threat response action. + + Attributes: + threat_id: Identifier of the mitigated threat. + action: Description of the action taken. + success: Whether the action succeeded. + details: Additional response metadata. + responded_at: UTC timestamp. + """ + + threat_id: str + action: str + success: bool + details: dict[str, Any] = field(default_factory=dict) + responded_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + + +class SecurityAgent: + """Autonomous security monitoring and response agent. 
+ + Detects threats through pattern analysis and anomaly detection, + and executes automated response playbooks. + + Attributes: + blocked_ips: Currently blocked IP addresses. + threat_log: All detected threats. + response_log: All executed response actions. + _rate_limit_counters: Request counts per IP for rate limiting. + _rate_limit_threshold: Requests per window before blocking. + """ + + def __init__(self, rate_limit_threshold: int = 100) -> None: + """Initialise the security agent. + + Args: + rate_limit_threshold: Requests per monitoring window to trigger + rate limiting. + """ + self.blocked_ips: set[str] = set() + self.threat_log: list[ThreatIndicator] = [] + self.response_log: list[ThreatResponse] = [] + self._rate_limit_counters: dict[str, int] = {} + self._rate_limit_threshold = rate_limit_threshold + self._threat_counter = 0 + logger.info("SecurityAgent initialised (rate_limit={})", rate_limit_threshold) + + async def scan(self, events: list[SecurityEvent]) -> list[ThreatIndicator]: + """Scan a batch of security events for threats. + + Args: + events: Security events to analyse. + + Returns: + List of detected :class:`ThreatIndicator` objects. + """ + threats: list[ThreatIndicator] = [] + await asyncio.sleep(0) + + for event in events: + detected = self._analyse_event(event) + threats.extend(detected) + + self.threat_log.extend(threats) + if threats: + logger.warning("Scan complete: {} threat(s) detected in {} events", len(threats), len(events)) + else: + logger.debug("Scan clean: {} events analysed", len(events)) + return threats + + def _analyse_event(self, event: SecurityEvent) -> list[ThreatIndicator]: + """Apply detection heuristics to a single event. + + Args: + event: The security event to evaluate. + + Returns: + List of threats detected (may be empty). 
+ """ + threats: list[ThreatIndicator] = [] + + # Rate limiting check + if event.source_ip in self.blocked_ips: + self._threat_counter += 1 + threats.append(ThreatIndicator( + threat_id=f"threat_{self._threat_counter:06d}", + threat_level=ThreatLevel.HIGH, + threat_type="blocked_ip_access", + source_ip=event.source_ip, + description=f"Request from blocked IP {event.source_ip}", + evidence={"event_id": event.event_id}, + )) + + # Increment rate limit counter + self._rate_limit_counters[event.source_ip] = ( + self._rate_limit_counters.get(event.source_ip, 0) + 1 + ) + if self._rate_limit_counters[event.source_ip] > self._rate_limit_threshold: + self._threat_counter += 1 + threats.append(ThreatIndicator( + threat_id=f"threat_{self._threat_counter:06d}", + threat_level=ThreatLevel.MEDIUM, + threat_type="rate_limit_exceeded", + source_ip=event.source_ip, + description=f"IP {event.source_ip} exceeded rate limit", + evidence={"count": self._rate_limit_counters[event.source_ip]}, + )) + + # SQL/command injection detection + injection_keywords = ["' OR ", "UNION SELECT", "DROP TABLE", "; rm -", "$(", "${IFS}"] + endpoint_lower = event.endpoint.lower() + for keyword in injection_keywords: + if keyword.lower() in endpoint_lower: + self._threat_counter += 1 + threats.append(ThreatIndicator( + threat_id=f"threat_{self._threat_counter:06d}", + threat_level=ThreatLevel.CRITICAL, + threat_type="injection_attempt", + source_ip=event.source_ip, + description=f"Injection pattern detected in endpoint", + evidence={"keyword": keyword, "endpoint": event.endpoint[:100]}, + )) + break # One alert per event for injection + + return threats + + async def detect_anomaly( + self, + events: list[SecurityEvent], + baseline_request_rate: float = 10.0, + ) -> list[ThreatIndicator]: + """Detect statistical anomalies in event patterns. + + Args: + events: Recent security events to analyse. + baseline_request_rate: Expected average requests per second. 
+ + Returns: + List of anomaly-based :class:`ThreatIndicator` objects. + """ + await asyncio.sleep(0) + threats: list[ThreatIndicator] = [] + + if not events: + return threats + + # Group by source IP and check for abnormal volume + ip_counts: dict[str, int] = {} + for event in events: + ip_counts[event.source_ip] = ip_counts.get(event.source_ip, 0) + 1 + + counts = np.array(list(ip_counts.values()), dtype=float) + if len(counts) < 2: + return threats + + mean_count = float(np.mean(counts)) + std_count = float(np.std(counts, ddof=1)) + 1e-6 + z_scores = (counts - mean_count) / std_count + + for ip, z_score in zip(ip_counts.keys(), z_scores): + if abs(z_score) > 3.0: + self._threat_counter += 1 + threats.append(ThreatIndicator( + threat_id=f"threat_{self._threat_counter:06d}", + threat_level=ThreatLevel.MEDIUM, + threat_type="volume_anomaly", + source_ip=ip, + description=f"Anomalous request volume from {ip} (z={z_score:.2f})", + evidence={"z_score": round(z_score, 2), "count": ip_counts[ip]}, + )) + + self.threat_log.extend(threats) + return threats + + async def respond_to_threat( + self, + threat: ThreatIndicator, + ) -> ThreatResponse: + """Execute an automated response to a detected threat. + + Args: + threat: The threat to respond to. + + Returns: + :class:`ThreatResponse` documenting the action taken. + + Raises: + ValueError: If ``threat`` has already been mitigated. 
+ """ + if threat.mitigated: + raise ValueError(f"Threat '{threat.threat_id}' is already mitigated") + + await asyncio.sleep(0) + action, success = self._select_response(threat) + threat.mitigated = success + + response = ThreatResponse( + threat_id=threat.threat_id, + action=action, + success=success, + details={ + "threat_type": threat.threat_type, + "threat_level": threat.threat_level.name, + "source_ip": threat.source_ip, + }, + ) + self.response_log.append(response) + log = logger.warning if success else logger.error + log( + "Threat '{}' response: {} → {}", + threat.threat_id, + action, + "SUCCESS" if success else "FAILED", + ) + return response + + def _select_response(self, threat: ThreatIndicator) -> tuple[str, bool]: + """Choose and simulate a response action for a threat. + + Args: + threat: Threat to respond to. + + Returns: + Tuple of ``(action_description, success_flag)``. + """ + if threat.threat_level in (ThreatLevel.HIGH, ThreatLevel.CRITICAL): + self.blocked_ips.add(threat.source_ip) + return f"IP {threat.source_ip} blocked permanently", True + if threat.threat_level == ThreatLevel.MEDIUM: + self._rate_limit_counters[threat.source_ip] = 0 + return f"Rate limit reset for {threat.source_ip}", True + return "Event logged for review", True diff --git a/agentic-aiops/anomaly_detection/__init__.py b/agentic-aiops/anomaly_detection/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/agentic-aiops/anomaly_detection/__pycache__/__init__.cpython-312.pyc b/agentic-aiops/anomaly_detection/__pycache__/__init__.cpython-312.pyc new file mode 100644 index 0000000..da57800 Binary files /dev/null and b/agentic-aiops/anomaly_detection/__pycache__/__init__.cpython-312.pyc differ diff --git a/agentic-aiops/anomaly_detection/__pycache__/behavior_anomaly.cpython-312.pyc b/agentic-aiops/anomaly_detection/__pycache__/behavior_anomaly.cpython-312.pyc new file mode 100644 index 0000000..0d382f4 Binary files /dev/null and 
b/agentic-aiops/anomaly_detection/__pycache__/behavior_anomaly.cpython-312.pyc differ diff --git a/agentic-aiops/anomaly_detection/__pycache__/log_anomaly.cpython-312.pyc b/agentic-aiops/anomaly_detection/__pycache__/log_anomaly.cpython-312.pyc new file mode 100644 index 0000000..aaf5c37 Binary files /dev/null and b/agentic-aiops/anomaly_detection/__pycache__/log_anomaly.cpython-312.pyc differ diff --git a/agentic-aiops/anomaly_detection/__pycache__/time_series_anomaly.cpython-312.pyc b/agentic-aiops/anomaly_detection/__pycache__/time_series_anomaly.cpython-312.pyc new file mode 100644 index 0000000..2a36e4e Binary files /dev/null and b/agentic-aiops/anomaly_detection/__pycache__/time_series_anomaly.cpython-312.pyc differ diff --git a/agentic-aiops/anomaly_detection/behavior_anomaly.py b/agentic-aiops/anomaly_detection/behavior_anomaly.py new file mode 100644 index 0000000..0300b55 --- /dev/null +++ b/agentic-aiops/anomaly_detection/behavior_anomaly.py @@ -0,0 +1,243 @@ +"""Behavioral anomaly detection using baseline comparison.""" + +from __future__ import annotations + +from dataclasses import dataclass, field +from datetime import datetime, timezone +from typing import Any + +import numpy as np +from loguru import logger + + +@dataclass +class BehaviorProfile: + """Baseline behavioral profile for a user or system component. + + Attributes: + entity_id: Identifier for the user/component being profiled. + feature_means: Per-feature mean values from baseline. + feature_stds: Per-feature standard deviations from baseline. + feature_names: Ordered list of feature names. + n_samples: Number of samples used to build the baseline. + built_at: UTC timestamp when the baseline was built. 
+ """ + + entity_id: str + feature_means: np.ndarray + feature_stds: np.ndarray + feature_names: list[str] + n_samples: int + built_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + + +@dataclass +class BehaviorAnomalyResult: + """Result of a behavioral anomaly check. + + Attributes: + entity_id: Checked entity identifier. + is_anomaly: Whether anomalous behaviour was detected. + anomaly_score: Overall anomaly score (0–1, higher = more anomalous). + anomalous_features: Features that contributed to the detection. + feature_scores: Per-feature anomaly scores. + detected_at: UTC timestamp. + """ + + entity_id: str + is_anomaly: bool + anomaly_score: float + anomalous_features: list[str] + feature_scores: dict[str, float] = field(default_factory=dict) + detected_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + + +class BehaviorAnomaly: + """Behavioral anomaly detection using baseline comparison. + + Builds per-entity baseline profiles and flags new observations that + deviate significantly using a Mahalanobis-inspired distance metric. + + Attributes: + profiles: Baseline profiles keyed by entity_id. + detection_history: All past anomaly results. + _zscore_threshold: Feature Z-score threshold. + _global_threshold: Global anomaly score threshold (0–1). + """ + + def __init__( + self, + zscore_threshold: float = 3.0, + global_threshold: float = 0.7, + ) -> None: + """Initialise the behavioral anomaly detector. + + Args: + zscore_threshold: Per-feature Z-score above which a feature is + flagged. + global_threshold: Overall anomaly score threshold for declaring + anomalous behaviour. 
+ """ + self.profiles: dict[str, BehaviorProfile] = {} + self.detection_history: list[BehaviorAnomalyResult] = [] + self._zscore_threshold = zscore_threshold + self._global_threshold = global_threshold + logger.info( + "BehaviorAnomaly initialised (zscore={}, global={})", + zscore_threshold, + global_threshold, + ) + + def build_profile( + self, + entity_id: str, + observations: np.ndarray, + feature_names: list[str] | None = None, + ) -> BehaviorProfile: + """Build a baseline behavioral profile for an entity. + + Args: + entity_id: Entity identifier. + observations: 2-D array of shape (n_samples, n_features). + feature_names: Optional feature labels. + + Returns: + The built :class:`BehaviorProfile`. + + Raises: + ValueError: If ``observations`` has fewer than 10 samples. + ValueError: If ``observations`` is not 2-D. + """ + observations = np.atleast_2d(np.asarray(observations, dtype=float)) + if observations.ndim != 2: + raise ValueError("observations must be 2-D (n_samples × n_features)") + n_samples, n_features = observations.shape + if n_samples < 10: + raise ValueError(f"Baseline requires ≥10 samples, got {n_samples}") + + if feature_names is None: + feature_names = [f"feature_{i}" for i in range(n_features)] + if len(feature_names) != n_features: + raise ValueError( + f"feature_names length {len(feature_names)} != n_features {n_features}" + ) + + means = np.mean(observations, axis=0) + stds = np.std(observations, axis=0, ddof=1) + 1e-10 + + profile = BehaviorProfile( + entity_id=entity_id, + feature_means=means, + feature_stds=stds, + feature_names=feature_names, + n_samples=n_samples, + ) + self.profiles[entity_id] = profile + logger.info( + "Behavior profile built for '{}': {} features, {} samples", + entity_id, + n_features, + n_samples, + ) + return profile + + def detect( + self, + entity_id: str, + observation: np.ndarray, + ) -> BehaviorAnomalyResult: + """Compare a new observation against the entity's baseline profile. 
+ + Args: + entity_id: Entity to check. + observation: 1-D feature vector (must match profile dimensions). + + Returns: + :class:`BehaviorAnomalyResult` with anomaly classification. + + Raises: + KeyError: If no profile exists for ``entity_id``. + ValueError: If ``observation`` has the wrong number of features. + """ + profile = self._get_profile(entity_id) + observation = np.asarray(observation, dtype=float).ravel() + + if len(observation) != len(profile.feature_means): + raise ValueError( + f"observation has {len(observation)} features, " + f"profile expects {len(profile.feature_means)}" + ) + + z_scores = np.abs((observation - profile.feature_means) / profile.feature_stds) + anomalous_features: list[str] = [] + feature_scores: dict[str, float] = {} + + for i, (name, z) in enumerate(zip(profile.feature_names, z_scores)): + score = float(min(1.0, z / (self._zscore_threshold * 2 + 1e-10))) + feature_scores[name] = round(score, 4) + if z > self._zscore_threshold: + anomalous_features.append(name) + + # Global score = fraction of features exceeding threshold, weighted by score + global_score = float(np.mean(list(feature_scores.values()))) + is_anomaly = ( + global_score >= self._global_threshold + or len(anomalous_features) / max(len(profile.feature_names), 1) > 0.5 + ) + + result = BehaviorAnomalyResult( + entity_id=entity_id, + is_anomaly=is_anomaly, + anomaly_score=round(global_score, 4), + anomalous_features=anomalous_features, + feature_scores=feature_scores, + ) + self.detection_history.append(result) + + if is_anomaly: + logger.warning( + "Behavioral anomaly for '{}': score={:.4f}, features={}", + entity_id, + global_score, + anomalous_features, + ) + else: + logger.debug("Behavior check OK for '{}' (score={:.4f})", entity_id, global_score) + + return result + + def batch_detect( + self, + entity_id: str, + observations: np.ndarray, + ) -> list[BehaviorAnomalyResult]: + """Detect anomalies across multiple observations. + + Args: + entity_id: Entity to check. 
+ observations: 2-D array of shape (n_obs, n_features). + + Returns: + List of :class:`BehaviorAnomalyResult` for each observation. + """ + observations = np.atleast_2d(np.asarray(observations, dtype=float)) + return [self.detect(entity_id, obs) for obs in observations] + + def _get_profile(self, entity_id: str) -> BehaviorProfile: + """Retrieve a profile, raising KeyError if not found. + + Args: + entity_id: Entity identifier. + + Returns: + The :class:`BehaviorProfile`. + + Raises: + KeyError: If no profile has been built. + """ + if entity_id not in self.profiles: + raise KeyError( + f"No baseline profile for entity '{entity_id}'. " + "Call build_profile() first." + ) + return self.profiles[entity_id] diff --git a/agentic-aiops/anomaly_detection/log_anomaly.py b/agentic-aiops/anomaly_detection/log_anomaly.py new file mode 100644 index 0000000..ee9983d --- /dev/null +++ b/agentic-aiops/anomaly_detection/log_anomaly.py @@ -0,0 +1,222 @@ +"""Log pattern anomaly detection using frequency analysis.""" + +from __future__ import annotations + +import re +from collections import Counter +from dataclasses import dataclass, field +from datetime import datetime, timezone +from typing import Any + +import numpy as np +from loguru import logger + + +@dataclass +class LogAnomaly: + """A detected anomalous log pattern. + + Attributes: + pattern: The anomalous log pattern or message template. + frequency: How often this pattern appeared in the current window. + expected_frequency: Expected frequency from the baseline. + frequency_ratio: current / expected (>1 = more common, <1 = less common). + anomaly_score: Normalised anomaly score (0–1). + is_anomaly: Whether this pattern is classified as anomalous. + sample_messages: Up to 3 example raw log lines. + detected_at: UTC timestamp. 
+ """ + + pattern: str + frequency: int + expected_frequency: float + frequency_ratio: float + anomaly_score: float + is_anomaly: bool + sample_messages: list[str] = field(default_factory=list) + detected_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + + +# Regex templates for normalising log messages into patterns +_NORMALISATION_RULES: list[tuple[re.Pattern[str], str]] = [ + (re.compile(r"\b\d{1,3}\.\d{1,3}\.\d{1,3}\.\d{1,3}\b"), ""), + (re.compile(r"\b[0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12}\b", re.IGNORECASE), ""), + (re.compile(r"\b\d{4}-\d{2}-\d{2}[T ]\d{2}:\d{2}:\d{2}(?:\.\d+)?(?:Z|[+-]\d{2}:\d{2})?\b"), ""), + (re.compile(r"\b\d+\b"), ""), + (re.compile(r'"[^"]{0,200}"'), ""), +] + + +class LogAnomalyDetector: + """Log pattern anomaly detection using frequency-based analysis. + + Maintains a baseline pattern frequency distribution and detects + new log windows that deviate significantly. + + Attributes: + baseline_frequencies: Pattern → expected frequency per window. + detection_history: All past detection results. + _z_threshold: Z-score threshold for frequency anomalies. + _new_pattern_threshold: Fraction of messages in new patterns + above which a new-pattern alert fires. + """ + + def __init__( + self, + z_threshold: float = 3.0, + new_pattern_threshold: float = 0.1, + ) -> None: + """Initialise the log anomaly detector. + + Args: + z_threshold: Z-score threshold for frequency anomalies. + new_pattern_threshold: Fraction of new patterns that triggers + an alert. 
+ """ + self.baseline_frequencies: dict[str, float] = {} + self.detection_history: list[LogAnomaly] = [] + self._z_threshold = z_threshold + self._new_pattern_threshold = new_pattern_threshold + self._baseline_std: dict[str, float] = {} + logger.info("LogAnomalyDetector initialised (z={}, new_pat={})", z_threshold, new_pattern_threshold) + + def build_baseline(self, log_lines: list[str]) -> dict[str, float]: + """Build a frequency baseline from a reference log corpus. + + Args: + log_lines: List of reference log message strings. + + Returns: + Mapping of pattern → mean frequency count. + + Raises: + ValueError: If ``log_lines`` is empty. + """ + if not log_lines: + raise ValueError("log_lines must not be empty") + + patterns = [self._normalise(line) for line in log_lines] + counts = Counter(patterns) + total = len(log_lines) + + # Store as fraction for normalised comparison + self.baseline_frequencies = { + pat: count / total for pat, count in counts.items() + } + # Use a heuristic std: assume Poisson-like (std ≈ sqrt(mean)) + self._baseline_std = { + pat: max(1e-4, (freq / total) ** 0.5 / total) + for pat, freq in counts.items() + } + logger.info("Baseline built: {} unique patterns from {} lines", len(counts), total) + return dict(self.baseline_frequencies) + + def detect( + self, + log_lines: list[str], + *, + return_all: bool = False, + ) -> list[LogAnomaly]: + """Detect anomalous patterns in a new log window. + + Args: + log_lines: Current log lines to analyse. + return_all: If ``True``, return results for all patterns (not + just anomalies). + + Returns: + List of :class:`LogAnomaly` for detected anomalies + (or all patterns if ``return_all=True``). + + Raises: + RuntimeError: If no baseline has been built yet. + ValueError: If ``log_lines`` is empty. + """ + if not self.baseline_frequencies: + raise RuntimeError("Baseline not built. 
Call build_baseline() first.") + if not log_lines: + raise ValueError("log_lines must not be empty") + + total = len(log_lines) + patterns = [self._normalise(line) for line in log_lines] + current_counts = Counter(patterns) + current_freqs = {pat: count / total for pat, count in current_counts.items()} + + # Sample messages per pattern + sample_map: dict[str, list[str]] = {} + for line, pat in zip(log_lines, patterns): + if pat not in sample_map: + sample_map[pat] = [] + if len(sample_map[pat]) < 3: + sample_map[pat].append(line[:200]) + + results: list[LogAnomaly] = [] + new_pattern_count = 0 + + all_patterns = set(self.baseline_frequencies) | set(current_freqs) + + for pattern in all_patterns: + current_freq = current_freqs.get(pattern, 0.0) + expected_freq = self.baseline_frequencies.get(pattern, 0.0) + raw_count = current_counts.get(pattern, 0) + + is_new = pattern not in self.baseline_frequencies + if is_new: + new_pattern_count += 1 + + # Anomaly score based on normalised deviation + if expected_freq < 1e-10: + score = min(1.0, current_freq * 10.0) if current_freq > 0 else 0.0 + is_anomaly = current_freq > self._new_pattern_threshold + else: + ratio = current_freq / expected_freq + score = min(1.0, abs(ratio - 1.0)) + std = self._baseline_std.get(pattern, 1e-4) + z = abs((current_freq - expected_freq) / std) + is_anomaly = z > self._z_threshold + + ratio = current_freq / (expected_freq + 1e-10) + anomaly = LogAnomaly( + pattern=pattern[:200], + frequency=raw_count, + expected_frequency=round(expected_freq * total, 2), + frequency_ratio=round(float(ratio), 4), + anomaly_score=round(score, 4), + is_anomaly=is_anomaly, + sample_messages=sample_map.get(pattern, []), + ) + if is_anomaly or return_all: + results.append(anomaly) + + # Check for new pattern rate + new_rate = new_pattern_count / max(len(all_patterns), 1) + if new_rate > self._new_pattern_threshold: + logger.warning( + "High new pattern rate: {:.1%} ({} new patterns)", + new_rate, + new_pattern_count, 
+ ) + + anomalies = [r for r in results if r.is_anomaly] + self.detection_history.extend(anomalies) + + if anomalies: + logger.warning("{} log anomalies detected in {} lines", len(anomalies), total) + else: + logger.debug("No log anomalies in {} lines", total) + + return results if return_all else anomalies + + def _normalise(self, line: str) -> str: + """Normalise a log line into a pattern by replacing variable parts. + + Args: + line: Raw log message. + + Returns: + Normalised pattern string. + """ + result = line.strip() + for pattern, replacement in _NORMALISATION_RULES: + result = pattern.sub(replacement, result) + return result[:200] # Truncate for memory efficiency diff --git a/agentic-aiops/anomaly_detection/time_series_anomaly.py b/agentic-aiops/anomaly_detection/time_series_anomaly.py new file mode 100644 index 0000000..e05856d --- /dev/null +++ b/agentic-aiops/anomaly_detection/time_series_anomaly.py @@ -0,0 +1,253 @@ +"""Time-series anomaly detection using Z-score and IQR methods.""" + +from __future__ import annotations + +from dataclasses import dataclass, field +from datetime import datetime, timezone + +import numpy as np +from loguru import logger + + +@dataclass +class TimeSeriesAnomalyResult: + """Result of a time-series anomaly detection run. + + Attributes: + metric_name: Name of the evaluated metric. + method: Detection method used (``"zscore"`` or ``"iqr"``). + anomaly_indices: Indices of detected anomalies in the input array. + anomaly_scores: Corresponding anomaly scores. + threshold: Detection threshold used. + n_anomalies: Total number of anomalies detected. + detected_at: UTC timestamp. + """ + + metric_name: str + method: str + anomaly_indices: list[int] + anomaly_scores: list[float] + threshold: float + n_anomalies: int + detected_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + + +class TimeSeriesAnomaly: + """Z-score and IQR based anomaly detection for system metrics. 
+ + Provides two complementary methods: + - **Z-score**: Robust for roughly Gaussian metrics (CPU, memory). + - **IQR**: Robust for skewed or heavy-tailed metrics (latency, errors). + + Attributes: + detection_history: All past detection results. + _zscore_threshold: Z-score threshold for anomaly classification. + _iqr_multiplier: IQR multiplier for fence calculation. + """ + + def __init__( + self, + zscore_threshold: float = 3.0, + iqr_multiplier: float = 1.5, + ) -> None: + """Initialise the time-series anomaly detector. + + Args: + zscore_threshold: Z-score absolute value above which a point is + anomalous (default 3.0 = ~0.3% false positive rate). + iqr_multiplier: Multiplier for IQR fence (1.5 = mild, 3.0 = extreme). + """ + self.detection_history: list[TimeSeriesAnomalyResult] = [] + self._zscore_threshold = zscore_threshold + self._iqr_multiplier = iqr_multiplier + logger.info( + "TimeSeriesAnomaly initialised (zscore={}, iqr_mult={})", + zscore_threshold, + iqr_multiplier, + ) + + def detect_zscore( + self, + data: np.ndarray, + metric_name: str = "metric", + threshold: float | None = None, + ) -> TimeSeriesAnomalyResult: + """Detect anomalies using a modified Z-score (median-based). + + Uses the median absolute deviation (MAD) for robustness against + existing outliers corrupting the mean/std estimates. + + Args: + data: 1-D array of metric values (time-ordered). + metric_name: Name for labelling the result. + threshold: Override the default Z-score threshold. + + Returns: + :class:`TimeSeriesAnomalyResult` with detected anomaly indices. + + Raises: + ValueError: If ``data`` has fewer than 5 samples. 
+ """ + data = np.asarray(data, dtype=float) + if len(data) < 5: + raise ValueError(f"data must have ≥5 samples, got {len(data)}") + + threshold = threshold or self._zscore_threshold + median = float(np.median(data)) + mad = float(np.median(np.abs(data - median))) + mad_std = mad * 1.4826 # Consistency factor for normal distribution + + if mad_std < 1e-10: + # All values identical — no anomalies + z_scores = np.zeros(len(data)) + else: + z_scores = np.abs(data - median) / mad_std + + anomaly_mask = z_scores > threshold + anomaly_indices = list(np.where(anomaly_mask)[0].astype(int)) + anomaly_scores = [round(float(z_scores[i]), 4) for i in anomaly_indices] + + result = TimeSeriesAnomalyResult( + metric_name=metric_name, + method="zscore", + anomaly_indices=anomaly_indices, + anomaly_scores=anomaly_scores, + threshold=threshold, + n_anomalies=len(anomaly_indices), + ) + self.detection_history.append(result) + + if anomaly_indices: + logger.warning( + "Z-score: {} anomalies in '{}' at indices {}", + len(anomaly_indices), + metric_name, + anomaly_indices[:10], + ) + else: + logger.debug("Z-score: no anomalies in '{}'", metric_name) + + return result + + def detect_iqr( + self, + data: np.ndarray, + metric_name: str = "metric", + multiplier: float | None = None, + ) -> TimeSeriesAnomalyResult: + """Detect anomalies using the IQR (Tukey fence) method. + + Args: + data: 1-D array of metric values (time-ordered). + metric_name: Name for labelling the result. + multiplier: Override the default IQR multiplier. + + Returns: + :class:`TimeSeriesAnomalyResult` with detected anomaly indices. + + Raises: + ValueError: If ``data`` has fewer than 5 samples. 
+ """ + data = np.asarray(data, dtype=float) + if len(data) < 5: + raise ValueError(f"data must have ≥5 samples, got {len(data)}") + + mult = multiplier or self._iqr_multiplier + q1, q3 = float(np.percentile(data, 25)), float(np.percentile(data, 75)) + iqr = q3 - q1 + lower_fence = q1 - mult * iqr + upper_fence = q3 + mult * iqr + + anomaly_mask = (data < lower_fence) | (data > upper_fence) + anomaly_indices = list(np.where(anomaly_mask)[0].astype(int)) + + # Score = normalised distance outside the fence + scores: list[float] = [] + for i in anomaly_indices: + if data[i] < lower_fence: + score = (lower_fence - data[i]) / (iqr + 1e-10) + else: + score = (data[i] - upper_fence) / (iqr + 1e-10) + scores.append(round(float(score), 4)) + + result = TimeSeriesAnomalyResult( + metric_name=metric_name, + method="iqr", + anomaly_indices=anomaly_indices, + anomaly_scores=scores, + threshold=mult, + n_anomalies=len(anomaly_indices), + ) + self.detection_history.append(result) + + if anomaly_indices: + logger.warning( + "IQR: {} anomalies in '{}' (fences [{:.2f}, {:.2f}])", + len(anomaly_indices), + metric_name, + lower_fence, + upper_fence, + ) + else: + logger.debug( + "IQR: no anomalies in '{}' (fences [{:.2f}, {:.2f}])", + metric_name, + lower_fence, + upper_fence, + ) + + return result + + def detect_rolling_zscore( + self, + data: np.ndarray, + metric_name: str = "metric", + window: int = 20, + threshold: float | None = None, + ) -> TimeSeriesAnomalyResult: + """Detect anomalies using a rolling window Z-score. + + Suitable for non-stationary time series where the baseline drifts. + + Args: + data: 1-D array of metric values. + metric_name: Metric label. + window: Rolling window size. + threshold: Z-score threshold override. + + Returns: + :class:`TimeSeriesAnomalyResult`. + + Raises: + ValueError: If ``len(data) < window``. 
+ """ + data = np.asarray(data, dtype=float) + if len(data) < window: + raise ValueError(f"data length {len(data)} < window {window}") + + threshold = threshold or self._zscore_threshold + z_scores = np.zeros(len(data)) + + for i in range(window, len(data)): + window_data = data[i - window: i] + w_mean = float(np.mean(window_data)) + w_std = float(np.std(window_data, ddof=1)) + 1e-10 + z_scores[i] = abs((data[i] - w_mean) / w_std) + + anomaly_mask = z_scores > threshold + anomaly_indices = list(np.where(anomaly_mask)[0].astype(int)) + anomaly_scores = [round(float(z_scores[i]), 4) for i in anomaly_indices] + + result = TimeSeriesAnomalyResult( + metric_name=metric_name, + method="rolling_zscore", + anomaly_indices=anomaly_indices, + anomaly_scores=anomaly_scores, + threshold=threshold, + n_anomalies=len(anomaly_indices), + ) + self.detection_history.append(result) + logger.debug( + "Rolling Z-score: {} anomalies in '{}'", len(anomaly_indices), metric_name + ) + return result diff --git a/agentic-aiops/automation/__init__.py b/agentic-aiops/automation/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/agentic-aiops/automation/__pycache__/__init__.cpython-312.pyc b/agentic-aiops/automation/__pycache__/__init__.cpython-312.pyc new file mode 100644 index 0000000..f7fac8b Binary files /dev/null and b/agentic-aiops/automation/__pycache__/__init__.cpython-312.pyc differ diff --git a/agentic-aiops/automation/__pycache__/capacity_planning.cpython-312.pyc b/agentic-aiops/automation/__pycache__/capacity_planning.cpython-312.pyc new file mode 100644 index 0000000..e9170b9 Binary files /dev/null and b/agentic-aiops/automation/__pycache__/capacity_planning.cpython-312.pyc differ diff --git a/agentic-aiops/automation/__pycache__/chaos_engineering.cpython-312.pyc b/agentic-aiops/automation/__pycache__/chaos_engineering.cpython-312.pyc new file mode 100644 index 0000000..b06d353 Binary files /dev/null and 
b/agentic-aiops/automation/__pycache__/chaos_engineering.cpython-312.pyc differ diff --git a/agentic-aiops/automation/__pycache__/incident_response.cpython-312.pyc b/agentic-aiops/automation/__pycache__/incident_response.cpython-312.pyc new file mode 100644 index 0000000..4cab0a0 Binary files /dev/null and b/agentic-aiops/automation/__pycache__/incident_response.cpython-312.pyc differ diff --git a/agentic-aiops/automation/capacity_planning.py b/agentic-aiops/automation/capacity_planning.py new file mode 100644 index 0000000..a9ecc10 --- /dev/null +++ b/agentic-aiops/automation/capacity_planning.py @@ -0,0 +1,289 @@ +"""Capacity planning with auto-scaling logic based on usage trends.""" + +from __future__ import annotations + +from dataclasses import dataclass, field +from datetime import datetime, timezone +from typing import Any + +import numpy as np +from loguru import logger + + +@dataclass +class CapacityMetrics: + """Resource utilisation metrics for capacity planning. + + Attributes: + component: Service or resource identifier. + cpu_utilisation: CPU utilisation fraction (0–1). + memory_utilisation: Memory utilisation fraction (0–1). + request_rate: Requests per second. + current_replicas: Current number of running instances. + max_replicas: Configured maximum replicas. + min_replicas: Configured minimum replicas. + collected_at: UTC timestamp. + """ + + component: str + cpu_utilisation: float + memory_utilisation: float + request_rate: float + current_replicas: int + max_replicas: int + min_replicas: int = 1 + collected_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + + +@dataclass +class ScalingDecision: + """An auto-scaling recommendation. + + Attributes: + component: Target component. + action: ``"scale_up"``, ``"scale_down"``, or ``"no_change"``. + current_replicas: Replicas before the action. + recommended_replicas: Recommended new replica count. + reason: Human-readable justification. + confidence: Decision confidence (0–1). 
+ decided_at: UTC timestamp. + """ + + component: str + action: str + current_replicas: int + recommended_replicas: int + reason: str + confidence: float + decided_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + + +@dataclass +class ForecastResult: + """Resource usage forecast. + + Attributes: + component: Forecasted component. + horizon_hours: Forecast horizon in hours. + forecasted_cpu: Predicted CPU utilisation per hour. + forecasted_requests: Predicted request rate per hour. + capacity_breach_hour: Hour index at which capacity is breached + (None if no breach predicted). + recommended_scale_by: Recommended additional replicas. + """ + + component: str + horizon_hours: int + forecasted_cpu: list[float] + forecasted_requests: list[float] + capacity_breach_hour: int | None + recommended_scale_by: int + + +class CapacityPlanning: + """Auto-scaling and capacity planning based on usage trends and forecasting. + + Uses linear trend extrapolation for short-horizon forecasts and + rule-based threshold logic for scaling decisions. + + Attributes: + metrics_history: Per-component time-series of metric snapshots. + scaling_history: Log of all scaling decisions. + _cpu_scale_up_threshold: CPU fraction triggering scale-up. + _cpu_scale_down_threshold: CPU fraction triggering scale-down. + _request_rate_scale_factor: Requests/replica target. + """ + + def __init__( + self, + cpu_scale_up: float = 0.75, + cpu_scale_down: float = 0.25, + request_rate_per_replica: float = 100.0, + ) -> None: + """Initialise the capacity planner. + + Args: + cpu_scale_up: CPU utilisation fraction above which scale-up triggers. + cpu_scale_down: CPU utilisation fraction below which scale-down triggers. + request_rate_per_replica: Target requests/sec per replica. 
+ """ + self.metrics_history: dict[str, list[CapacityMetrics]] = {} + self.scaling_history: list[ScalingDecision] = [] + self._cpu_scale_up_threshold = cpu_scale_up + self._cpu_scale_down_threshold = cpu_scale_down + self._request_rate_per_replica = request_rate_per_replica + logger.info( + "CapacityPlanning initialised (cpu_up={}, cpu_down={}, rps_per_replica={})", + cpu_scale_up, + cpu_scale_down, + request_rate_per_replica, + ) + + def record_metrics(self, metrics: CapacityMetrics) -> None: + """Record a capacity metrics snapshot. + + Args: + metrics: Metrics snapshot to store. + """ + component = metrics.component + if component not in self.metrics_history: + self.metrics_history[component] = [] + self.metrics_history[component].append(metrics) + logger.debug( + "Capacity metrics recorded for '{}': cpu={:.1%}, mem={:.1%}, rps={:.1f}", + component, + metrics.cpu_utilisation, + metrics.memory_utilisation, + metrics.request_rate, + ) + + def decide_scaling(self, metrics: CapacityMetrics) -> ScalingDecision: + """Determine whether to scale a component up or down. + + Uses CPU utilisation and request rate to compute the recommended + replica count. + + Args: + metrics: Current resource metrics. + + Returns: + :class:`ScalingDecision` recommendation. 
+ """ + component = metrics.component + current = metrics.current_replicas + + # Compute replica target from request rate + rps_target = max( + metrics.min_replicas, + int(np.ceil(metrics.request_rate / self._request_rate_per_replica)), + ) + + # Apply CPU-based adjustment + if metrics.cpu_utilisation > self._cpu_scale_up_threshold: + cpu_target = min(metrics.max_replicas, current + max(1, current // 2)) + reason = f"CPU at {metrics.cpu_utilisation:.1%} > {self._cpu_scale_up_threshold:.0%} threshold" + action = "scale_up" + elif metrics.cpu_utilisation < self._cpu_scale_down_threshold and current > metrics.min_replicas: + cpu_target = max(metrics.min_replicas, current - 1) + reason = f"CPU at {metrics.cpu_utilisation:.1%} < {self._cpu_scale_down_threshold:.0%} threshold" + action = "scale_down" + else: + cpu_target = current + reason = f"CPU at {metrics.cpu_utilisation:.1%} within thresholds" + action = "no_change" + + recommended = max(rps_target, cpu_target) + recommended = int(np.clip(recommended, metrics.min_replicas, metrics.max_replicas)) + + if recommended > current: + action = "scale_up" + elif recommended < current: + action = "scale_down" + else: + action = "no_change" + recommended = current + + confidence = self._compute_confidence(metrics) + decision = ScalingDecision( + component=component, + action=action, + current_replicas=current, + recommended_replicas=recommended, + reason=reason, + confidence=round(confidence, 4), + ) + self.scaling_history.append(decision) + logger.info( + "Scaling decision for '{}': {} ({} → {} replicas)", + component, + action, + current, + recommended, + ) + return decision + + def forecast( + self, + component: str, + horizon_hours: int = 24, + ) -> ForecastResult: + """Forecast resource usage using linear trend extrapolation. + + Args: + component: Component to forecast. + horizon_hours: Number of hours ahead to forecast. + + Returns: + :class:`ForecastResult` with per-hour predictions. 
+ + Raises: + ValueError: If fewer than 2 metric snapshots are available. + KeyError: If no metrics history for this component. + """ + if component not in self.metrics_history: + raise KeyError(f"No metrics history for component '{component}'") + + history = self.metrics_history[component] + if len(history) < 2: + raise ValueError(f"Need ≥2 samples for forecasting, got {len(history)}") + + cpu_values = np.array([m.cpu_utilisation for m in history]) + rps_values = np.array([m.request_rate for m in history]) + n = len(cpu_values) + t = np.arange(n, dtype=float) + + # Linear regression + cpu_slope, cpu_intercept = float(np.polyfit(t, cpu_values, 1)) + rps_slope, rps_intercept = float(np.polyfit(t, rps_values, 1)) + + last_metrics = history[-1] + forecast_cpu: list[float] = [] + forecast_rps: list[float] = [] + breach_hour: int | None = None + + for h in range(horizon_hours): + t_future = n + h + cpu_pred = float(np.clip(cpu_slope * t_future + cpu_intercept, 0.0, 1.0)) + rps_pred = float(max(0.0, rps_slope * t_future + rps_intercept)) + forecast_cpu.append(round(cpu_pred, 4)) + forecast_rps.append(round(rps_pred, 2)) + + if breach_hour is None and cpu_pred > self._cpu_scale_up_threshold: + breach_hour = h + + max_rps = max(forecast_rps) if forecast_rps else 0.0 + recommended_scale = max( + 0, + int(np.ceil(max_rps / self._request_rate_per_replica)) - last_metrics.current_replicas, + ) + + result = ForecastResult( + component=component, + horizon_hours=horizon_hours, + forecasted_cpu=forecast_cpu, + forecasted_requests=forecast_rps, + capacity_breach_hour=breach_hour, + recommended_scale_by=recommended_scale, + ) + logger.info( + "Forecast for '{}': horizon={}h, breach_hour={}, scale_by={}", + component, + horizon_hours, + breach_hour, + recommended_scale, + ) + return result + + def _compute_confidence(self, metrics: CapacityMetrics) -> float: + """Compute confidence in a scaling decision. + + Args: + metrics: Current metrics snapshot. 
+ + Returns: + Confidence score (0–1). + """ + history = self.metrics_history.get(metrics.component, []) + n = len(history) + # More history → higher confidence, asymptotic to 0.95 + return min(0.95, 0.5 + 0.45 * (1 - 1 / (1 + n / 10.0))) diff --git a/agentic-aiops/automation/chaos_engineering.py b/agentic-aiops/automation/chaos_engineering.py new file mode 100644 index 0000000..15cf6f1 --- /dev/null +++ b/agentic-aiops/automation/chaos_engineering.py @@ -0,0 +1,357 @@ +"""Chaos engineering framework for resilience testing via controlled failure injection.""" + +from __future__ import annotations + +import asyncio +import uuid +from dataclasses import dataclass, field +from datetime import datetime, timezone +from enum import Enum, auto +from typing import Any, Callable, Awaitable + +import numpy as np +from loguru import logger + + +class ExperimentType(Enum): + """Categories of chaos experiment.""" + + LATENCY_INJECTION = auto() + ERROR_INJECTION = auto() + CPU_STRESS = auto() + MEMORY_STRESS = auto() + NETWORK_PARTITION = auto() + PROCESS_KILL = auto() + DISK_FILL = auto() + + +class ExperimentStatus(Enum): + """Lifecycle states of a chaos experiment.""" + + PENDING = auto() + RUNNING = auto() + COMPLETED = auto() + ABORTED = auto() + FAILED = auto() + + +@dataclass +class ChaosExperiment: + """Specification for a chaos engineering experiment. + + Attributes: + experiment_id: Unique identifier. + name: Human-readable name. + experiment_type: Category of failure to inject. + target_component: Service or component under test. + blast_radius: Fraction of traffic/instances affected (0–1). + duration_seconds: How long to sustain the failure. + parameters: Type-specific parameters (e.g. latency_ms, error_rate). + hypothesis: Expected system behaviour under this failure. + abort_conditions: Metric conditions that trigger experiment abort. 
+ """ + + experiment_id: str + name: str + experiment_type: ExperimentType + target_component: str + blast_radius: float + duration_seconds: float + parameters: dict[str, Any] = field(default_factory=dict) + hypothesis: str = "" + abort_conditions: dict[str, float] = field(default_factory=dict) + + +@dataclass +class ExperimentResult: + """Outcome of a chaos experiment. + + Attributes: + experiment_id: Owning experiment identifier. + status: Final experiment status. + hypothesis_validated: Whether the hypothesis held under failure. + observations: Key metric observations during the experiment. + abort_reason: Reason for abort if status is ABORTED. + started_at: UTC start timestamp. + completed_at: UTC completion timestamp. + duration_ms: Actual experiment duration. + """ + + experiment_id: str + status: ExperimentStatus + hypothesis_validated: bool + observations: dict[str, Any] + abort_reason: str = "" + started_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + completed_at: datetime | None = None + duration_ms: float = 0.0 + + +class ChaosEngineering: + """Resilience testing framework with controlled failure injection. + + Implements the chaos engineering principles: define steady state, + hypothesise, inject failure, observe, validate. + + Attributes: + experiments: Registered experiments keyed by ID. + results: Completed experiment results. + _abort_callbacks: Optional callbacks invoked on abort conditions. + _steady_state_metrics: Baseline metrics for comparison. + """ + + def __init__(self) -> None: + """Initialise the chaos engineering framework.""" + self.experiments: dict[str, ChaosExperiment] = {} + self.results: list[ExperimentResult] = [] + self._steady_state_metrics: dict[str, float] = {} + logger.info("ChaosEngineering framework initialised") + + def define_steady_state(self, metrics: dict[str, float]) -> None: + """Define the system steady state for hypothesis validation. 
+ + Args: + metrics: Mapping of metric name to acceptable baseline value. + """ + self._steady_state_metrics = dict(metrics) + logger.info("Steady state defined: {}", metrics) + + def create_experiment( + self, + name: str, + experiment_type: ExperimentType, + target_component: str, + blast_radius: float = 0.1, + duration_seconds: float = 60.0, + parameters: dict[str, Any] | None = None, + hypothesis: str = "", + abort_conditions: dict[str, float] | None = None, + ) -> ChaosExperiment: + """Create and register a chaos experiment. + + Args: + name: Experiment name. + experiment_type: Type of failure to inject. + target_component: Target service. + blast_radius: Fraction of instances/traffic affected (0–1). + duration_seconds: Experiment duration. + parameters: Type-specific parameters. + hypothesis: Expected behaviour description. + abort_conditions: Metric thresholds that trigger abort. + + Returns: + The created :class:`ChaosExperiment`. + + Raises: + ValueError: If ``blast_radius`` is not in (0, 1]. + """ + if not 0 < blast_radius <= 1.0: + raise ValueError(f"blast_radius must be in (0, 1], got {blast_radius}") + + experiment_id = str(uuid.uuid4()) + experiment = ChaosExperiment( + experiment_id=experiment_id, + name=name, + experiment_type=experiment_type, + target_component=target_component, + blast_radius=blast_radius, + duration_seconds=duration_seconds, + parameters=parameters or {}, + hypothesis=hypothesis, + abort_conditions=abort_conditions or {}, + ) + self.experiments[experiment_id] = experiment + logger.info( + "Chaos experiment '{}' created (id={}, type={}, radius={:.0%})", + name, + experiment_id, + experiment_type.name, + blast_radius, + ) + return experiment + + async def run_experiment( + self, + experiment_id: str, + metric_collector: Callable[[], Awaitable[dict[str, float]]] | None = None, + ) -> ExperimentResult: + """Execute a chaos experiment with monitoring and auto-abort. + + Args: + experiment_id: Experiment to run. 
+ metric_collector: Async callable returning live metrics during + the experiment. Uses a simulator when ``None``. + + Returns: + :class:`ExperimentResult` with observations and outcome. + + Raises: + KeyError: If ``experiment_id`` is not found. + """ + experiment = self._get_experiment(experiment_id) + import time + start_ts = datetime.now(timezone.utc) + start_mono = time.monotonic() + + logger.warning( + "CHAOS: Starting '{}' on '{}' ({:.0%} blast radius, {}s)", + experiment.name, + experiment.target_component, + experiment.blast_radius, + experiment.duration_seconds, + ) + + observations: dict[str, Any] = { + "experiment_type": experiment.experiment_type.name, + "target": experiment.target_component, + "blast_radius": experiment.blast_radius, + "metric_samples": [], + } + status = ExperimentStatus.COMPLETED + abort_reason = "" + + try: + await self._inject_failure(experiment) + collector = metric_collector or self._default_metric_collector + n_samples = max(3, int(experiment.duration_seconds / 10)) + + for _ in range(n_samples): + await asyncio.sleep(0) + live_metrics = await collector() + observations["metric_samples"].append(live_metrics) + + # Check abort conditions + abort_triggered, abort_reason = self._check_abort( + live_metrics, experiment.abort_conditions + ) + if abort_triggered: + status = ExperimentStatus.ABORTED + logger.error("Experiment aborted: {}", abort_reason) + break + + await self._remove_failure(experiment) + + except Exception as exc: + status = ExperimentStatus.FAILED + abort_reason = str(exc) + logger.exception("Chaos experiment '{}' failed: {}", experiment_id, exc) + + duration_ms = (time.monotonic() - start_mono) * 1000 + hypothesis_validated = status == ExperimentStatus.COMPLETED and self._validate_hypothesis( + observations + ) + + result = ExperimentResult( + experiment_id=experiment_id, + status=status, + hypothesis_validated=hypothesis_validated, + observations=observations, + abort_reason=abort_reason, + started_at=start_ts, + 
completed_at=datetime.now(timezone.utc), + duration_ms=round(duration_ms, 2), + ) + self.results.append(result) + logger.info( + "Chaos experiment '{}' completed: status={}, hypothesis_validated={}", + experiment_id, + status.name, + hypothesis_validated, + ) + return result + + async def _inject_failure(self, experiment: ChaosExperiment) -> None: + """Simulate failure injection for an experiment type. + + Args: + experiment: Experiment specification. + """ + await asyncio.sleep(0) + logger.debug( + "Injecting {} into '{}'", experiment.experiment_type.name, experiment.target_component + ) + + async def _remove_failure(self, experiment: ChaosExperiment) -> None: + """Simulate failure removal (restore steady state). + + Args: + experiment: Experiment specification. + """ + await asyncio.sleep(0) + logger.debug( + "Removing {} from '{}'", experiment.experiment_type.name, experiment.target_component + ) + + async def _default_metric_collector(self) -> dict[str, float]: + """Collect simulated metrics during an experiment. + + Returns: + Dictionary of simulated metric readings. + """ + await asyncio.sleep(0) + rng = np.random.default_rng() + return { + "error_rate": float(rng.beta(2, 20)), + "latency_p99_ms": float(rng.lognormal(5.0, 0.8)), + "cpu_percent": float(rng.uniform(40, 90)), + "availability": float(rng.uniform(0.95, 1.0)), + } + + def _check_abort( + self, + metrics: dict[str, float], + abort_conditions: dict[str, float], + ) -> tuple[bool, str]: + """Check whether any abort condition is breached. + + Args: + metrics: Current metric readings. + abort_conditions: Threshold mapping (abort if metric > threshold). + + Returns: + Tuple of ``(should_abort, reason)``. 
+ """ + for metric, threshold in abort_conditions.items(): + value = metrics.get(metric) + if value is not None and value > threshold: + return True, f"{metric}={value:.4f} > abort threshold {threshold}" + return False, "" + + def _validate_hypothesis(self, observations: dict[str, Any]) -> bool: + """Validate the experiment hypothesis against steady state. + + Args: + observations: Collected observations. + + Returns: + ``True`` if steady state was maintained (hypothesis validated). + """ + if not self._steady_state_metrics or not observations.get("metric_samples"): + return True # Cannot disprove + + samples = observations["metric_samples"] + for metric, baseline in self._steady_state_metrics.items(): + values = [s.get(metric) for s in samples if metric in s] + if not values: + continue + mean_value = float(np.mean(values)) + # Fail if mean deviates more than 50% from baseline + if abs(mean_value - baseline) / (abs(baseline) + 1e-10) > 0.5: + return False + return True + + def _get_experiment(self, experiment_id: str) -> ChaosExperiment: + """Retrieve an experiment by ID. + + Args: + experiment_id: Experiment identifier. + + Returns: + The :class:`ChaosExperiment`. + + Raises: + KeyError: If not found. 
+ """ + if experiment_id not in self.experiments: + raise KeyError(f"Experiment '{experiment_id}' not found") + return self.experiments[experiment_id] diff --git a/agentic-aiops/automation/incident_response.py b/agentic-aiops/automation/incident_response.py new file mode 100644 index 0000000..355cdb5 --- /dev/null +++ b/agentic-aiops/automation/incident_response.py @@ -0,0 +1,294 @@ +"""Automated incident response with severity classification and runbook execution.""" + +from __future__ import annotations + +import asyncio +import uuid +from dataclasses import dataclass, field +from datetime import datetime, timezone +from enum import Enum, auto +from typing import Any + +import numpy as np +from loguru import logger + + +class Severity(Enum): + """Incident severity levels aligned with SRE practices.""" + + SEV1 = 1 # Critical: complete service outage + SEV2 = 2 # High: major functionality impaired + SEV3 = 3 # Medium: degraded performance + SEV4 = 4 # Low: minor issue, workaround available + SEV5 = 5 # Informational + + +class IncidentStatus(Enum): + """Lifecycle status of an incident.""" + + OPEN = auto() + INVESTIGATING = auto() + MITIGATING = auto() + RESOLVED = auto() + POSTMORTEM = auto() + + +@dataclass +class Incident: + """A detected or declared operational incident. + + Attributes: + incident_id: Unique identifier (auto-generated). + title: Short description. + description: Detailed incident description. + severity: Classified severity level. + affected_components: List of impacted service components. + status: Current lifecycle status. + created_at: UTC creation timestamp. + resolved_at: UTC resolution timestamp (set on resolution). + runbook_steps: Ordered list of response steps to execute. + timeline: Ordered list of timestamped event strings. + metadata: Arbitrary additional context. 
+ """ + + incident_id: str + title: str + description: str + severity: Severity + affected_components: list[str] + status: IncidentStatus = IncidentStatus.OPEN + created_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + resolved_at: datetime | None = None + runbook_steps: list[str] = field(default_factory=list) + timeline: list[str] = field(default_factory=list) + metadata: dict[str, Any] = field(default_factory=dict) + + +@dataclass +class RunbookExecution: + """Result of executing a single runbook step. + + Attributes: + step: Step description. + success: Whether execution succeeded. + output: Execution output or error message. + duration_ms: Execution time in milliseconds. + """ + + step: str + success: bool + output: str + duration_ms: float + + +class IncidentResponse: + """Automated incident handling with severity classification and runbook execution. + + Attributes: + incidents: All incidents keyed by incident_id. + _runbooks: Severity-to-runbook step mapping. 
+ """ + + _SEVERITY_RUNBOOKS: dict[Severity, list[str]] = { + Severity.SEV1: [ + "page_on_call_engineer", + "open_war_room", + "activate_incident_commander", + "notify_executive_stakeholders", + "enable_circuit_breakers", + "failover_to_backup_region", + "validate_failover", + "update_status_page", + "conduct_postmortem", + ], + Severity.SEV2: [ + "notify_on_call_team", + "diagnose_root_cause", + "apply_remediation", + "validate_fix", + "update_status_page", + "schedule_postmortem", + ], + Severity.SEV3: [ + "notify_team_channel", + "investigate_degradation", + "apply_workaround", + "monitor_for_improvement", + ], + Severity.SEV4: [ + "log_ticket", + "schedule_investigation", + ], + Severity.SEV5: [ + "log_for_awareness", + ], + } + + def __init__(self) -> None: + """Initialise the incident response system.""" + self.incidents: dict[str, Incident] = {} + logger.info("IncidentResponse initialised") + + def classify_severity( + self, + error_rate: float, + affected_user_pct: float, + latency_p99_ms: float, + data_loss: bool = False, + ) -> Severity: + """Classify incident severity from operational metrics. + + Args: + error_rate: Fraction of requests failing (0–1). + affected_user_pct: Percentage of users affected (0–100). + latency_p99_ms: 99th percentile latency in milliseconds. + data_loss: Whether data loss has occurred. + + Returns: + Classified :class:`Severity` level. + """ + if data_loss or error_rate > 0.5 or affected_user_pct > 50: + return Severity.SEV1 + if error_rate > 0.2 or affected_user_pct > 20 or latency_p99_ms > 5000: + return Severity.SEV2 + if error_rate > 0.05 or affected_user_pct > 5 or latency_p99_ms > 2000: + return Severity.SEV3 + if error_rate > 0.01 or latency_p99_ms > 1000: + return Severity.SEV4 + return Severity.SEV5 + + def create_incident( + self, + title: str, + description: str, + severity: Severity, + affected_components: list[str], + metadata: dict[str, Any] | None = None, + ) -> Incident: + """Create and register a new incident. 
+ + Args: + title: Short incident title. + description: Detailed description. + severity: Classified severity. + affected_components: List of impacted components. + metadata: Optional additional context. + + Returns: + The newly created :class:`Incident`. + """ + incident_id = f"INC-{uuid.uuid4().hex[:8].upper()}" + runbook = self._SEVERITY_RUNBOOKS.get(severity, ["investigate_manually"]) + incident = Incident( + incident_id=incident_id, + title=title, + description=description, + severity=severity, + affected_components=affected_components, + runbook_steps=list(runbook), + timeline=[f"[{datetime.now(timezone.utc).isoformat()}] Incident created"], + metadata=metadata or {}, + ) + self.incidents[incident_id] = incident + logger.warning( + "Incident {} created: [{}] {} ({})", + incident_id, + severity.name, + title, + affected_components, + ) + return incident + + async def execute_runbook(self, incident_id: str) -> list[RunbookExecution]: + """Execute the runbook associated with an incident. + + Args: + incident_id: Incident to execute runbook for. + + Returns: + List of :class:`RunbookExecution` results for each step. + + Raises: + KeyError: If ``incident_id`` is not found. + """ + incident = self._get_incident(incident_id) + incident.status = IncidentStatus.MITIGATING + results: list[RunbookExecution] = [] + + logger.info( + "Executing runbook for {} ({} steps): {}", + incident_id, + len(incident.runbook_steps), + incident.severity.name, + ) + + for step in incident.runbook_steps: + result = await self._execute_step(step) + results.append(result) + ts = datetime.now(timezone.utc).isoformat() + status_str = "OK" if result.success else "FAILED" + incident.timeline.append(f"[{ts}] {step}: {status_str}") + logger.debug("Runbook step '{}': {} ({:.1f}ms)", step, status_str, result.duration_ms) + + return results + + async def resolve(self, incident_id: str, resolution_note: str = "") -> Incident: + """Mark an incident as resolved. 
+ + Args: + incident_id: Incident to resolve. + resolution_note: Optional resolution description. + + Returns: + Updated :class:`Incident`. + + Raises: + KeyError: If not found. + """ + incident = self._get_incident(incident_id) + incident.status = IncidentStatus.RESOLVED + incident.resolved_at = datetime.now(timezone.utc) + ts = incident.resolved_at.isoformat() + incident.timeline.append(f"[{ts}] Resolved: {resolution_note or 'no note'}") + logger.info("Incident {} resolved", incident_id) + return incident + + async def _execute_step(self, step: str) -> RunbookExecution: + """Simulate execution of a runbook step. + + Args: + step: Step description. + + Returns: + Execution result. + """ + import time + start = time.monotonic() + await asyncio.sleep(0) + duration_ms = (time.monotonic() - start) * 1000 + + rng = np.random.default_rng(seed=hash(step) % (2**32)) + success = rng.random() > 0.1 # 90% success rate + output = f"Step '{step}' {'completed successfully' if success else 'encountered an error'}" + return RunbookExecution( + step=step, + success=success, + output=output, + duration_ms=round(duration_ms * 1000, 2), + ) + + def _get_incident(self, incident_id: str) -> Incident: + """Retrieve an incident by ID. + + Args: + incident_id: Incident identifier. + + Returns: + The :class:`Incident`. + + Raises: + KeyError: If not found. + """ + if incident_id not in self.incidents: + raise KeyError(f"Incident '{incident_id}' not found") + return self.incidents[incident_id] diff --git a/agi-orchestrator/__init__.py b/agi-orchestrator/__init__.py new file mode 100644 index 0000000..ce9320c --- /dev/null +++ b/agi-orchestrator/__init__.py @@ -0,0 +1,83 @@ +"""AGI Orchestrator package for the trading platform. + +Provides the top-level AGIOrchestrator that wires together the decision engine, +global state manager, goal hierarchy, self-improvement loops, reasoning modules, +and multi-agent coordination into a single coherent runtime. 
+""" + +from coordination.agent_coordinator import AgentCoordinator +from coordination.conflict_resolver import ConflictResolver +from coordination.resource_allocator import ResourceAllocator +from core.decision_engine import AGIDecisionEngine +from core.global_state_manager import GlobalStateManager +from core.goal_hierarchy import GoalHierarchy +from core.self_improvement import SelfImprovement +from reasoning.causal_inference import CausalInferenceEngine +from reasoning.meta_cognitive import MetaCognitive +from reasoning.strategic_planner import StrategicPlanner +from shared.common.logger import get_logger + +log = get_logger(__name__, service="agi-orchestrator") + + +class AGIOrchestrator: + """Top-level AGI orchestrator for the trading platform. + + Wires together all sub-systems (decision engine, goal hierarchy, reasoning, + coordination) and exposes a unified async lifecycle interface. + + Attributes: + state_manager: System-wide shared state store. + goal_hierarchy: Multi-objective goal tracker. + decision_engine: Meta-learning decision maker. + self_improvement: Autonomous performance-improvement loop. + causal_engine: Causal inference reasoner. + strategic_planner: Long-horizon strategy builder. + meta_cognitive: Self-reflection and confidence assessor. + agent_coordinator: Multi-agent lifecycle manager. + resource_allocator: Dynamic resource budget manager. + conflict_resolver: Inter-system conflict mediator. + """ + + def __init__(self, config: dict | None = None) -> None: + """Initialise all sub-systems with an optional configuration mapping. + + Args: + config: Optional key-value configuration overrides forwarded to + each sub-system during initialisation. 
+ """ + cfg = config or {} + self.state_manager = GlobalStateManager() + self.goal_hierarchy = GoalHierarchy() + self.decision_engine = AGIDecisionEngine(state_manager=self.state_manager) + self.self_improvement = SelfImprovement() + self.causal_engine = CausalInferenceEngine() + self.strategic_planner = StrategicPlanner() + self.meta_cognitive = MetaCognitive() + self.agent_coordinator = AgentCoordinator(state_manager=self.state_manager) + self.resource_allocator = ResourceAllocator() + self.conflict_resolver = ConflictResolver() + log.info("AGIOrchestrator initialised", config_keys=list(cfg.keys())) + + async def start(self) -> None: + """Start all async sub-systems in the correct dependency order. + + Raises: + RuntimeError: If any sub-system fails to start. + """ + log.info("AGIOrchestrator starting") + await self.state_manager.update_state("orchestrator_status", "running") + log.info("AGIOrchestrator running") + + async def stop(self) -> None: + """Gracefully shut down all sub-systems. + + Raises: + RuntimeError: If any sub-system fails during shutdown. 
+ """ + log.info("AGIOrchestrator stopping") + await self.state_manager.update_state("orchestrator_status", "stopped") + log.info("AGIOrchestrator stopped") + + +__all__ = ["AGIOrchestrator"] diff --git a/agi-orchestrator/__pycache__/__init__.cpython-312.pyc b/agi-orchestrator/__pycache__/__init__.cpython-312.pyc new file mode 100644 index 0000000..eeac7e1 Binary files /dev/null and b/agi-orchestrator/__pycache__/__init__.cpython-312.pyc differ diff --git a/agi-orchestrator/coordination/__init__.py b/agi-orchestrator/coordination/__init__.py new file mode 100644 index 0000000..165e466 --- /dev/null +++ b/agi-orchestrator/coordination/__init__.py @@ -0,0 +1 @@ +# AGI Orchestrator – coordination sub-package diff --git a/agi-orchestrator/coordination/__pycache__/__init__.cpython-312.pyc b/agi-orchestrator/coordination/__pycache__/__init__.cpython-312.pyc new file mode 100644 index 0000000..e852c34 Binary files /dev/null and b/agi-orchestrator/coordination/__pycache__/__init__.cpython-312.pyc differ diff --git a/agi-orchestrator/coordination/__pycache__/agent_coordinator.cpython-312.pyc b/agi-orchestrator/coordination/__pycache__/agent_coordinator.cpython-312.pyc new file mode 100644 index 0000000..f9b0fc5 Binary files /dev/null and b/agi-orchestrator/coordination/__pycache__/agent_coordinator.cpython-312.pyc differ diff --git a/agi-orchestrator/coordination/__pycache__/conflict_resolver.cpython-312.pyc b/agi-orchestrator/coordination/__pycache__/conflict_resolver.cpython-312.pyc new file mode 100644 index 0000000..3a62b98 Binary files /dev/null and b/agi-orchestrator/coordination/__pycache__/conflict_resolver.cpython-312.pyc differ diff --git a/agi-orchestrator/coordination/__pycache__/resource_allocator.cpython-312.pyc b/agi-orchestrator/coordination/__pycache__/resource_allocator.cpython-312.pyc new file mode 100644 index 0000000..6176b81 Binary files /dev/null and b/agi-orchestrator/coordination/__pycache__/resource_allocator.cpython-312.pyc differ diff --git 
a/agi-orchestrator/coordination/agent_coordinator.py b/agi-orchestrator/coordination/agent_coordinator.py new file mode 100644 index 0000000..e52e860 --- /dev/null +++ b/agi-orchestrator/coordination/agent_coordinator.py @@ -0,0 +1,162 @@ +"""Agent Coordinator – multi-agent lifecycle management and orchestration. + +Maintains a registry of active agents, routes work to them, and provides a +broadcast mechanism for publishing state updates to all registered agents. +""" + +from __future__ import annotations + +import asyncio +from dataclasses import dataclass, field +from typing import Any, Callable, Coroutine + +from shared.common.logger import get_logger + +log = get_logger(__name__, service="agi-orchestrator") + +# Type alias for async agent handler. +AgentHandler = Callable[[dict[str, Any]], Coroutine[Any, Any, Any]] + + +@dataclass +class AgentRegistration: + """Metadata for a registered agent. + + Attributes: + agent_id: Unique identifier for the agent. + name: Human-readable name. + capabilities: List of capability tags (e.g. ``["trade", "risk"]``). + handler: Async callable that processes task payloads. + metadata: Arbitrary extra attributes. + """ + + agent_id: str + name: str + capabilities: list[str] = field(default_factory=list) + handler: AgentHandler | None = field(default=None, repr=False) + metadata: dict[str, Any] = field(default_factory=dict) + + +class AgentCoordinator: + """Multi-agent orchestrator supporting registration, coordination, and broadcast. + + Attributes: + state_manager: Optional shared :class:`GlobalStateManager`. + _agents: Registry mapping agent IDs to :class:`AgentRegistration`. + """ + + def __init__(self, state_manager: Any | None = None) -> None: + """Initialise the coordinator. + + Args: + state_manager: Optional shared state store for reporting. 
+ """ + self.state_manager = state_manager + self._agents: dict[str, AgentRegistration] = {} + log.info("AgentCoordinator initialised") + + def register_agent(self, registration: AgentRegistration) -> str: + """Add an agent to the coordinator's registry. + + Args: + registration: :class:`AgentRegistration` describing the agent. + + Returns: + The ``agent_id`` of the registered agent. + + Raises: + ValueError: If an agent with the same ``agent_id`` is already registered. + """ + if registration.agent_id in self._agents: + raise ValueError(f"Agent '{registration.agent_id}' is already registered") + self._agents[registration.agent_id] = registration + log.info( + "Agent registered", + agent_id=registration.agent_id, + name=registration.name, + capabilities=registration.capabilities, + ) + return registration.agent_id + + async def coordinate( + self, + task: dict[str, Any], + required_capability: str | None = None, + ) -> list[Any]: + """Route *task* to all agents that possess the required capability. + + When *required_capability* is *None* the task is sent to every + registered agent. Tasks are dispatched concurrently via + :func:`asyncio.gather`. + + Args: + task: Payload dict forwarded to each matching agent's handler. + required_capability: Optional capability filter. + + Returns: + List of results returned by each agent's handler (in no guaranteed + order). + + Raises: + RuntimeError: If no agents match the requested capability. 
+ """ + targets = [ + reg + for reg in self._agents.values() + if required_capability is None or required_capability in reg.capabilities + ] + if not targets: + raise RuntimeError( + f"No agents available for capability '{required_capability}'" + ) + + log.info( + "Coordinating task", + capability=required_capability, + agent_count=len(targets), + ) + + async def _dispatch(reg: AgentRegistration) -> Any: + if reg.handler is None: + log.warning("Agent has no handler", agent_id=reg.agent_id) + return None + try: + return await reg.handler(task) + except Exception as exc: # noqa: BLE001 + log.error("Agent handler error", agent_id=reg.agent_id, error=str(exc)) + return None + + results = await asyncio.gather(*(_dispatch(r) for r in targets)) + return list(results) + + async def broadcast(self, message: dict[str, Any]) -> int: + """Send *message* to every registered agent's handler in parallel. + + Args: + message: Payload broadcast to all agents. + + Returns: + Number of agents that received the message (handler not *None*). + """ + recipients = [r for r in self._agents.values() if r.handler is not None] + if not recipients: + log.debug("Broadcast skipped – no handlers registered") + return 0 + + async def _send(reg: AgentRegistration) -> None: + try: + await reg.handler(message) # type: ignore[misc] + except Exception as exc: # noqa: BLE001 + log.error("Broadcast handler error", agent_id=reg.agent_id, error=str(exc)) + + await asyncio.gather(*(_send(r) for r in recipients)) + log.info("Broadcast sent", recipient_count=len(recipients)) + return len(recipients) + + def list_agents(self) -> list[AgentRegistration]: + """Return a snapshot of all currently registered agents. + + Returns: + List of :class:`AgentRegistration` objects. 
+ """ + return list(self._agents.values()) diff --git a/agi-orchestrator/coordination/conflict_resolver.py b/agi-orchestrator/coordination/conflict_resolver.py new file mode 100644 index 0000000..cdc1907 --- /dev/null +++ b/agi-orchestrator/coordination/conflict_resolver.py @@ -0,0 +1,177 @@ +"""Conflict Resolver – inter-system conflict detection and resolution. + +When multiple sub-systems issue contradictory directives (e.g. one agent +wants to buy while another wants to sell the same asset), the resolver +detects the conflict, applies an arbitration policy, and returns a +resolved directive. +""" + +from __future__ import annotations + +import uuid +from dataclasses import dataclass, field +from enum import Enum, auto +from typing import Any + +from shared.common.logger import get_logger + +log = get_logger(__name__, service="agi-orchestrator") + + +class ConflictType(Enum): + """Classification of detected conflicts.""" + + DIRECTIONAL = auto() # Opposing buy/sell signals. + RESOURCE = auto() # Over-subscription of a shared resource. + PRIORITY = auto() # Competing goals at the same priority level. + TEMPORAL = auto() # Time-window overlaps in scheduled actions. + UNKNOWN = auto() + + +@dataclass +class Conflict: + """A detected inter-system conflict. + + Attributes: + conflict_id: Unique identifier, auto-generated. + conflict_type: Classification of the conflict. + parties: List of agent/system IDs involved. + directives: The contradictory directives that caused the conflict. + severity: Numeric severity in ``[0.0, 1.0]``. + resolved: Whether a resolution has been applied. + resolution: The chosen resolution directive (populated by :meth:`resolve`). 
+ """ + + conflict_id: str = field(default_factory=lambda: str(uuid.uuid4())) + conflict_type: ConflictType = ConflictType.UNKNOWN + parties: list[str] = field(default_factory=list) + directives: list[dict[str, Any]] = field(default_factory=list) + severity: float = 0.5 + resolved: bool = False + resolution: dict[str, Any] = field(default_factory=dict) + + +class ConflictResolver: + """Detects, resolves, and arbitrates inter-system conflicts. + + Attributes: + _conflicts: History of all detected conflicts keyed by ``conflict_id``. + _arbitration_policy: Strategy used when automatic resolution fails. + """ + + def __init__(self, arbitration_policy: str = "priority") -> None: + """Initialise the resolver with an arbitration policy. + + Args: + arbitration_policy: Strategy for tie-breaking. Supported values: + ``"priority"`` (higher-priority directive wins) and + ``"conservative"`` (least-aggressive directive wins). + """ + if arbitration_policy not in {"priority", "conservative"}: + raise ValueError( + f"Unknown arbitration_policy '{arbitration_policy}'. " + "Choose 'priority' or 'conservative'." + ) + self._conflicts: dict[str, Conflict] = {} + self._arbitration_policy = arbitration_policy + log.info("ConflictResolver initialised", policy=arbitration_policy) + + def detect_conflict(self, directives: list[dict[str, Any]]) -> Conflict | None: + """Analyse a set of directives and return a :class:`Conflict` if found. + + A directional conflict is detected when two directives target the same + asset with opposing actions (``"buy"`` vs ``"sell"``). + + Args: + directives: List of directive dicts, each containing at minimum + ``action`` and optionally ``asset`` and ``agent_id`` keys. + + Returns: + A new :class:`Conflict` if one is found, otherwise *None*. + """ + if len(directives) < 2: + return None + + # Build action map per asset. 
+ asset_actions: dict[str, list[dict[str, Any]]] = {} + for d in directives: + asset = d.get("asset", "global") + asset_actions.setdefault(asset, []).append(d) + + for asset, asset_directives in asset_actions.items(): + actions = {d.get("action", "").lower() for d in asset_directives} + if "buy" in actions and "sell" in actions: + parties = [d.get("agent_id", "unknown") for d in asset_directives] + conflict = Conflict( + conflict_type=ConflictType.DIRECTIONAL, + parties=parties, + directives=asset_directives, + severity=0.8, + ) + self._conflicts[conflict.conflict_id] = conflict + log.warning( + "Conflict detected", + conflict_id=conflict.conflict_id, + conflict_type=conflict.conflict_type.name, + asset=asset, + parties=parties, + ) + return conflict + + return None + + def resolve(self, conflict: Conflict) -> dict[str, Any]: + """Apply automatic resolution logic to a detected conflict. + + Args: + conflict: The :class:`Conflict` to resolve. + + Returns: + The chosen resolution directive dict. + """ + if conflict.resolved: + log.debug("Conflict already resolved", conflict_id=conflict.conflict_id) + return conflict.resolution + + resolution = self.arbitrate(conflict) + conflict.resolution = resolution + conflict.resolved = True + log.info( + "Conflict resolved", + conflict_id=conflict.conflict_id, + resolution_action=resolution.get("action"), + ) + return resolution + + def arbitrate(self, conflict: Conflict) -> dict[str, Any]: + """Apply the configured arbitration policy to select a winning directive. + + Args: + conflict: The :class:`Conflict` being arbitrated. + + Returns: + The winning directive dict according to the policy. + """ + if not conflict.directives: + return {"action": "hold", "reason": "no directives to arbitrate"} + + if self._arbitration_policy == "priority": + # Directive with the highest ``priority`` value wins. 
+ winner = max( + conflict.directives, + key=lambda d: float(d.get("priority", 0.0)), + ) + else: # conservative + # Directive with the least-aggressive action wins (hold > buy > sell). + aggression = {"hold": 0, "buy": 1, "sell": 1, "short": 2} + winner = min( + conflict.directives, + key=lambda d: aggression.get(d.get("action", "hold").lower(), 99), + ) + + log.info( + "Arbitration complete", + policy=self._arbitration_policy, + winning_action=winner.get("action"), + ) + return dict(winner) diff --git a/agi-orchestrator/coordination/resource_allocator.py b/agi-orchestrator/coordination/resource_allocator.py new file mode 100644 index 0000000..36c8318 --- /dev/null +++ b/agi-orchestrator/coordination/resource_allocator.py @@ -0,0 +1,182 @@ +"""Resource Allocator – dynamic resource budget management. + +Tracks named resource pools (CPU, memory, API quota, …) and provides +allocation/release semantics with utilisation reporting. +""" + +from __future__ import annotations + +from dataclasses import dataclass, field +from typing import Any + +from shared.common.logger import get_logger + +log = get_logger(__name__, service="agi-orchestrator") + + +@dataclass +class ResourcePool: + """A named resource bucket with a fixed capacity. + + Attributes: + name: Human-readable resource name (e.g. ``"cpu"``, ``"memory_gb"``). + capacity: Total available units. + allocated: Currently committed units. + metadata: Arbitrary tags. + """ + + name: str + capacity: float + allocated: float = 0.0 + metadata: dict[str, Any] = field(default_factory=dict) + + @property + def available(self) -> float: + """Remaining unallocated units.""" + return max(0.0, self.capacity - self.allocated) + + @property + def utilisation(self) -> float: + """Fraction of capacity currently in use, in ``[0.0, 1.0]``.""" + return self.allocated / self.capacity if self.capacity else 0.0 + + +@dataclass +class Allocation: + """A recorded allocation ticket. + + Attributes: + allocation_id: Unique ticket identifier. 
@dataclass
class Allocation:
    """A recorded allocation ticket.

    Attributes:
        allocation_id: Unique ticket identifier.
        resource_name: Name of the pool allocated from.
        units: Number of units reserved.
        owner: Agent or component that owns this allocation.
    """

    allocation_id: str
    resource_name: str
    units: float
    owner: str = "unknown"


class ResourceAllocator:
    """Dynamic resource manager that tracks pools and outstanding allocations.

    Attributes:
        _pools: Registered resource pools keyed by name.
        _allocations: Outstanding allocation tickets keyed by ``allocation_id``.
    """

    def __init__(self) -> None:
        """Initialise with no pools and no outstanding allocations."""
        self._pools: dict[str, ResourcePool] = {}
        self._allocations: dict[str, Allocation] = {}
        log.info("ResourceAllocator initialised")

    def register_pool(self, name: str, capacity: float, metadata: dict[str, Any] | None = None) -> None:
        """Register a new named resource pool.

        Args:
            name: Unique pool name.
            capacity: Total available units.
            metadata: Optional tags.

        Raises:
            ValueError: If *name* is already registered or *capacity* ≤ 0.
        """
        if name in self._pools:
            raise ValueError(f"Pool '{name}' already registered")
        if capacity <= 0:
            raise ValueError(f"capacity must be positive, got {capacity}")
        tags = metadata if metadata is not None else {}
        self._pools[name] = ResourcePool(name=name, capacity=capacity, metadata=tags)
        log.info("Resource pool registered", name=name, capacity=capacity)

    def allocate(
        self,
        allocation_id: str,
        resource_name: str,
        units: float,
        owner: str = "unknown",
    ) -> Allocation:
        """Reserve *units* from the named pool.

        Args:
            allocation_id: Unique ticket identifier chosen by the caller.
            resource_name: Name of the pool to allocate from.
            units: Number of units to reserve.
            owner: Identifier of the requesting component.

        Returns:
            The created :class:`Allocation` ticket.

        Raises:
            KeyError: If *resource_name* is not registered.
            ValueError: If insufficient capacity is available or *units* ≤ 0.
        """
        if (bucket := self._pools.get(resource_name)) is None:
            raise KeyError(f"Resource pool '{resource_name}' not found")
        if units <= 0:
            raise ValueError(f"units must be positive, got {units}")
        if units > bucket.available:
            raise ValueError(
                f"Insufficient capacity: requested {units}, available {bucket.available}"
            )

        bucket.allocated += units
        record = Allocation(
            allocation_id=allocation_id,
            resource_name=resource_name,
            units=units,
            owner=owner,
        )
        self._allocations[allocation_id] = record
        log.info(
            "Resources allocated",
            allocation_id=allocation_id,
            resource=resource_name,
            units=units,
            utilisation=f"{bucket.utilisation:.1%}",
        )
        return record

    def release(self, allocation_id: str) -> None:
        """Return previously reserved units back to the pool.

        Args:
            allocation_id: Ticket identifier returned by :meth:`allocate`.

        Raises:
            KeyError: If *allocation_id* is not found.
        """
        try:
            record = self._allocations.pop(allocation_id)
        except KeyError:
            raise KeyError(f"Allocation '{allocation_id}' not found") from None

        bucket = self._pools[record.resource_name]
        # Clamp at zero so a stale double-release can never drive the pool
        # into negative allocation.
        bucket.allocated = max(0.0, bucket.allocated - record.units)
        log.info(
            "Resources released",
            allocation_id=allocation_id,
            resource=record.resource_name,
            units=record.units,
        )

    def get_utilization(self) -> dict[str, dict[str, float]]:
        """Return a utilisation snapshot for every registered pool.

        Returns:
            Mapping of pool name → dict with ``capacity``, ``allocated``,
            ``available``, and ``utilisation`` keys.
        """
        report: dict[str, dict[str, float]] = {}
        for pool_name, bucket in self._pools.items():
            report[pool_name] = {
                "capacity": bucket.capacity,
                "allocated": bucket.allocated,
                "available": bucket.available,
                "utilisation": bucket.utilisation,
            }
        log.debug("Utilisation report generated", pools=list(report.keys()))
        return report
+ """ + report = { + name: { + "capacity": pool.capacity, + "allocated": pool.allocated, + "available": pool.available, + "utilisation": pool.utilisation, + } + for name, pool in self._pools.items() + } + log.debug("Utilisation report generated", pools=list(report.keys())) + return report diff --git a/agi-orchestrator/core/__init__.py b/agi-orchestrator/core/__init__.py new file mode 100644 index 0000000..123cdca --- /dev/null +++ b/agi-orchestrator/core/__init__.py @@ -0,0 +1 @@ +# AGI Orchestrator – core sub-package diff --git a/agi-orchestrator/core/__pycache__/__init__.cpython-312.pyc b/agi-orchestrator/core/__pycache__/__init__.cpython-312.pyc new file mode 100644 index 0000000..5ae3293 Binary files /dev/null and b/agi-orchestrator/core/__pycache__/__init__.cpython-312.pyc differ diff --git a/agi-orchestrator/core/__pycache__/decision_engine.cpython-312.pyc b/agi-orchestrator/core/__pycache__/decision_engine.cpython-312.pyc new file mode 100644 index 0000000..4cb04d4 Binary files /dev/null and b/agi-orchestrator/core/__pycache__/decision_engine.cpython-312.pyc differ diff --git a/agi-orchestrator/core/__pycache__/global_state_manager.cpython-312.pyc b/agi-orchestrator/core/__pycache__/global_state_manager.cpython-312.pyc new file mode 100644 index 0000000..de09373 Binary files /dev/null and b/agi-orchestrator/core/__pycache__/global_state_manager.cpython-312.pyc differ diff --git a/agi-orchestrator/core/__pycache__/goal_hierarchy.cpython-312.pyc b/agi-orchestrator/core/__pycache__/goal_hierarchy.cpython-312.pyc new file mode 100644 index 0000000..137b3f5 Binary files /dev/null and b/agi-orchestrator/core/__pycache__/goal_hierarchy.cpython-312.pyc differ diff --git a/agi-orchestrator/core/__pycache__/self_improvement.cpython-312.pyc b/agi-orchestrator/core/__pycache__/self_improvement.cpython-312.pyc new file mode 100644 index 0000000..c31895d Binary files /dev/null and b/agi-orchestrator/core/__pycache__/self_improvement.cpython-312.pyc differ diff --git 
a/agi-orchestrator/core/decision_engine.py b/agi-orchestrator/core/decision_engine.py new file mode 100644 index 0000000..72f9fc5 --- /dev/null +++ b/agi-orchestrator/core/decision_engine.py @@ -0,0 +1,176 @@ +"""AGI Decision Engine – meta-learning multi-level decision maker. + +Decisions are grouped into three levels: + +* **Strategic** – long-horizon portfolio and regime decisions. +* **Tactical** – medium-horizon allocation and entry/exit timing. +* **Operational** – short-horizon execution and order management. +""" + +from __future__ import annotations + +import asyncio +from dataclasses import dataclass, field +from enum import Enum, auto +from typing import Any + +from shared.common.logger import get_logger + +log = get_logger(__name__, service="agi-orchestrator") + + +class DecisionLevel(Enum): + """Granularity tier for a decision.""" + + STRATEGIC = auto() + TACTICAL = auto() + OPERATIONAL = auto() + + +@dataclass +class Signal: + """A single named signal with an associated numeric value and metadata. + + Attributes: + name: Human-readable signal identifier. + value: Numeric magnitude of the signal. + source: Originating sub-system or agent. + metadata: Arbitrary extra key-value pairs. + """ + + name: str + value: float + source: str = "unknown" + metadata: dict[str, Any] = field(default_factory=dict) + + +@dataclass +class Decision: + """An output decision produced by the engine. + + Attributes: + level: The decision tier this belongs to. + action: Short action descriptor (e.g. ``"buy"``, ``"rebalance"``). + confidence: Probability-like confidence in [0, 1]. + rationale: Human-readable explanation. + metadata: Arbitrary supporting data. + """ + + level: DecisionLevel + action: str + confidence: float + rationale: str = "" + metadata: dict[str, Any] = field(default_factory=dict) + + +class AGIDecisionEngine: + """Meta-learning decision maker with three-level decision architecture. 
+ + The engine processes raw signals, synthesises them into a unified view, + and produces decisions at strategic, tactical, and operational levels. + + Attributes: + state_manager: Shared :class:`GlobalStateManager` instance (optional). + _signal_buffer: Accumulated signals awaiting processing. + _strategy_weights: Per-level numeric weight used during synthesis. + """ + + def __init__(self, state_manager: Any | None = None) -> None: + """Initialise the decision engine. + + Args: + state_manager: Optional shared state store injected at runtime. + """ + self.state_manager = state_manager + self._signal_buffer: list[Signal] = [] + self._strategy_weights: dict[DecisionLevel, float] = { + DecisionLevel.STRATEGIC: 0.5, + DecisionLevel.TACTICAL: 0.3, + DecisionLevel.OPERATIONAL: 0.2, + } + log.info("AGIDecisionEngine initialised") + + async def process_signals(self, signals: list[Signal]) -> None: + """Buffer incoming signals for the next decision cycle. + + Args: + signals: List of :class:`Signal` objects to accumulate. + + Raises: + TypeError: If *signals* is not a list. + """ + if not isinstance(signals, list): + raise TypeError(f"signals must be a list, got {type(signals).__name__}") + self._signal_buffer.extend(signals) + log.debug("Buffered signals", count=len(signals), total=len(self._signal_buffer)) + + async def synthesize(self) -> dict[str, Any]: + """Aggregate the current signal buffer into a unified market view. + + Clears the buffer after synthesis. + + Returns: + A mapping with keys ``signal_count``, ``net_value``, and + ``sources`` summarising the buffered signals. 
+ """ + if not self._signal_buffer: + log.debug("synthesize called with empty buffer") + return {"signal_count": 0, "net_value": 0.0, "sources": []} + + net_value = sum(s.value for s in self._signal_buffer) + sources = list({s.source for s in self._signal_buffer}) + result = { + "signal_count": len(self._signal_buffer), + "net_value": net_value, + "sources": sources, + } + self._signal_buffer.clear() + log.debug("Synthesised signals", **result) + return result + + async def make_decision( + self, + context: dict[str, Any], + level: DecisionLevel = DecisionLevel.TACTICAL, + ) -> Decision: + """Produce a decision for the requested level given the current context. + + The method synthesises any buffered signals, then applies level-specific + heuristics to determine the best action and a confidence score. + + Args: + context: Ambient information dict (e.g. market regime, portfolio + state) made available by the caller. + level: Decision tier to target. Defaults to + :attr:`DecisionLevel.TACTICAL`. + + Returns: + A :class:`Decision` describing the recommended action. + + Raises: + ValueError: If *context* is not a dict. 
+ """ + if not isinstance(context, dict): + raise ValueError(f"context must be a dict, got {type(context).__name__}") + + synthesis = await self.synthesize() + weight = self._strategy_weights[level] + + net = synthesis.get("net_value", 0.0) + confidence = min(abs(net) * weight, 1.0) + action = "buy" if net > 0 else ("sell" if net < 0 else "hold") + + decision = Decision( + level=level, + action=action, + confidence=confidence, + rationale=f"net_signal={net:.4f} weight={weight}", + metadata={"synthesis": synthesis, "context_keys": list(context.keys())}, + ) + log.info( + "Decision made", + level=level.name, + action=action, + confidence=f"{confidence:.3f}", + ) + return decision diff --git a/agi-orchestrator/core/global_state_manager.py b/agi-orchestrator/core/global_state_manager.py new file mode 100644 index 0000000..ff85c7a --- /dev/null +++ b/agi-orchestrator/core/global_state_manager.py @@ -0,0 +1,105 @@ +"""Global State Manager – system-wide async state store with pub/sub. + +All sub-systems read and write state through this single object, which +guarantees thread/task-safe access via :class:`asyncio.Lock` and notifies +subscribers whenever a key changes. +""" + +from __future__ import annotations + +import asyncio +from collections import defaultdict +from typing import Any, Callable, Coroutine + +from shared.common.logger import get_logger + +log = get_logger(__name__, service="agi-orchestrator") + +# Type alias for async subscriber callbacks. +SubscriberCallback = Callable[[str, Any], Coroutine[Any, Any, None]] + + +class GlobalStateManager: + """Thread-safe, async state store with subscriber notifications. + + Attributes: + _state: Internal key-value store. + _lock: Asyncio lock protecting concurrent state mutations. + _subscribers: Mapping from state key to list of async callbacks. 
+ """ + + def __init__(self) -> None: + """Initialise an empty state store with no subscribers.""" + self._state: dict[str, Any] = {} + self._lock: asyncio.Lock = asyncio.Lock() + self._subscribers: defaultdict[str, list[SubscriberCallback]] = defaultdict(list) + log.info("GlobalStateManager initialised") + + async def get_state(self, key: str, default: Any = None) -> Any: + """Retrieve the current value for *key*. + + Args: + key: State key to look up. + default: Value returned when *key* is absent. + + Returns: + The stored value, or *default* if the key does not exist. + """ + async with self._lock: + value = self._state.get(key, default) + log.debug("State read", key=key, found=(key in self._state)) + return value + + async def update_state(self, key: str, value: Any) -> None: + """Write *value* under *key* and notify all subscribers. + + Args: + key: State key to update. + value: New value to store. + """ + async with self._lock: + self._state[key] = value + log.debug("State updated", key=key) + await self._notify_subscribers(key, value) + + async def _notify_subscribers(self, key: str, value: Any) -> None: + """Invoke all callbacks registered for *key*. + + Errors in individual callbacks are caught and logged so that a single + misbehaving subscriber cannot block the notification chain. + + Args: + key: The state key that changed. + value: The new value. + """ + callbacks = self._subscribers.get(key, []) + for cb in callbacks: + try: + await cb(key, value) + except Exception as exc: # noqa: BLE001 + log.error("Subscriber callback failed", key=key, error=str(exc)) + + def subscribe(self, key: str, callback: SubscriberCallback) -> None: + """Register an async callback to be called whenever *key* changes. + + Args: + key: State key to watch. + callback: Async callable with signature + ``async def cb(key: str, value: Any) -> None``. + + Raises: + TypeError: If *callback* is not callable. 
+ """ + if not callable(callback): + raise TypeError(f"callback must be callable, got {type(callback).__name__}") + self._subscribers[key].append(callback) + log.debug("Subscriber registered", key=key) + + async def get_all_state(self) -> dict[str, Any]: + """Return a shallow copy of the entire state snapshot. + + Returns: + Dictionary mapping every stored key to its current value. + """ + async with self._lock: + return dict(self._state) diff --git a/agi-orchestrator/core/goal_hierarchy.py b/agi-orchestrator/core/goal_hierarchy.py new file mode 100644 index 0000000..33d367a --- /dev/null +++ b/agi-orchestrator/core/goal_hierarchy.py @@ -0,0 +1,150 @@ +"""Goal Hierarchy – multi-objective optimisation with priority-queue storage. + +Goals are stored as a min-heap keyed on *priority* (lower value = higher +urgency) so that the highest-priority goal is always retrieved first. +""" + +from __future__ import annotations + +import heapq +import uuid +from dataclasses import dataclass, field +from enum import Enum, auto +from typing import Any + +from shared.common.logger import get_logger + +log = get_logger(__name__, service="agi-orchestrator") + + +class GoalStatus(Enum): + """Lifecycle status of a goal.""" + + PENDING = auto() + ACTIVE = auto() + COMPLETED = auto() + FAILED = auto() + SUSPENDED = auto() + + +@dataclass(order=True) +class Goal: + """A single objective tracked by the hierarchy. + + The dataclass is *ordered* so that :mod:`heapq` can sort goals by + ``priority`` without a custom key function. + + Attributes: + priority: Numeric urgency (lower = more urgent). + name: Short human-readable label. + description: Extended description of the objective. + goal_id: Unique identifier, auto-generated when omitted. + status: Current lifecycle status. + progress: Completion fraction in ``[0.0, 1.0]``. + metadata: Arbitrary supporting data. 
+ """ + + priority: float + name: str = field(compare=False) + description: str = field(compare=False, default="") + goal_id: str = field(compare=False, default_factory=lambda: str(uuid.uuid4())) + status: GoalStatus = field(compare=False, default=GoalStatus.PENDING) + progress: float = field(compare=False, default=0.0) + metadata: dict[str, Any] = field(compare=False, default_factory=dict) + + +class GoalHierarchy: + """Multi-objective goal store backed by a min-heap priority queue. + + Attributes: + _heap: Min-heap of :class:`Goal` objects. + _goals_by_id: Fast O(1) lookup by ``goal_id``. + """ + + def __init__(self) -> None: + """Initialise an empty goal hierarchy.""" + self._heap: list[Goal] = [] + self._goals_by_id: dict[str, Goal] = {} + log.info("GoalHierarchy initialised") + + def add_goal(self, goal: Goal) -> str: + """Add a new goal to the hierarchy. + + Args: + goal: The :class:`Goal` to register. + + Returns: + The ``goal_id`` of the newly added goal. + + Raises: + ValueError: If a goal with the same ``goal_id`` already exists. + """ + if goal.goal_id in self._goals_by_id: + raise ValueError(f"Goal '{goal.goal_id}' already exists") + goal.status = GoalStatus.ACTIVE + heapq.heappush(self._heap, goal) + self._goals_by_id[goal.goal_id] = goal + log.info("Goal added", goal_id=goal.goal_id, name=goal.name, priority=goal.priority) + return goal.goal_id + + def get_active_goals(self, limit: int | None = None) -> list[Goal]: + """Return active goals ordered from highest to lowest urgency. + + Args: + limit: Maximum number of goals to return. Returns all when *None*. + + Returns: + Sorted list of goals whose status is :attr:`GoalStatus.ACTIVE`. 
+ """ + active = sorted( + (g for g in self._goals_by_id.values() if g.status == GoalStatus.ACTIVE), + ) + result = active[:limit] if limit is not None else active + log.debug("Active goals retrieved", count=len(result)) + return result + + def evaluate_progress(self, goal_id: str) -> dict[str, Any]: + """Compute and return a progress snapshot for the requested goal. + + Args: + goal_id: Identifier of the goal to evaluate. + + Returns: + A dict with keys ``goal_id``, ``name``, ``status``, ``progress``, + and ``on_track`` (``True`` when progress > 0.5). + + Raises: + KeyError: If *goal_id* does not exist in the hierarchy. + """ + if goal_id not in self._goals_by_id: + raise KeyError(f"Goal '{goal_id}' not found") + goal = self._goals_by_id[goal_id] + report = { + "goal_id": goal.goal_id, + "name": goal.name, + "status": goal.status.name, + "progress": goal.progress, + "on_track": goal.progress >= 0.5, + } + log.debug("Goal progress evaluated", **report) + return report + + def update_progress(self, goal_id: str, progress: float) -> None: + """Update the progress fraction for an existing goal. + + Args: + goal_id: Identifier of the goal to update. + progress: New progress value, clamped to ``[0.0, 1.0]``. + + Raises: + KeyError: If *goal_id* does not exist. + """ + if goal_id not in self._goals_by_id: + raise KeyError(f"Goal '{goal_id}' not found") + goal = self._goals_by_id[goal_id] + goal.progress = max(0.0, min(1.0, progress)) + if goal.progress >= 1.0: + goal.status = GoalStatus.COMPLETED + log.info("Goal completed", goal_id=goal_id) + else: + log.debug("Goal progress updated", goal_id=goal_id, progress=goal.progress) diff --git a/agi-orchestrator/core/self_improvement.py b/agi-orchestrator/core/self_improvement.py new file mode 100644 index 0000000..8d2b48c --- /dev/null +++ b/agi-orchestrator/core/self_improvement.py @@ -0,0 +1,175 @@ +"""Self-Improvement – autonomous learning loops for strategy refinement. 
+ +Records trade/decision outcomes, analyses performance statistics, and proposes +strategy weight adjustments so that the AGI continuously improves over time. +""" + +from __future__ import annotations + +import statistics +from dataclasses import dataclass, field +from typing import Any + +from shared.common.logger import get_logger + +log = get_logger(__name__, service="agi-orchestrator") + + +@dataclass +class Outcome: + """A recorded decision outcome used for learning. + + Attributes: + decision_id: Opaque identifier linking to the original decision. + action: The action that was taken (e.g. ``"buy"``, ``"hold"``). + predicted_confidence: Confidence at decision time. + actual_return: Realised return (positive = profit). + metadata: Arbitrary supporting data. + """ + + decision_id: str + action: str + predicted_confidence: float + actual_return: float + metadata: dict[str, Any] = field(default_factory=dict) + + +@dataclass +class PerformanceReport: + """Summary statistics over a set of recorded outcomes. + + Attributes: + sample_count: Number of outcomes analysed. + mean_return: Average realised return. + std_return: Standard deviation of returns (0.0 when < 2 samples). + win_rate: Fraction of outcomes with positive return. + mean_confidence_error: Average |predicted_confidence - win_indicator|. + suggested_adjustments: Recommended strategy parameter updates. + """ + + sample_count: int + mean_return: float + std_return: float + win_rate: float + mean_confidence_error: float + suggested_adjustments: dict[str, Any] = field(default_factory=dict) + + +class SelfImprovement: + """Autonomous learning loop that refines strategy weights from outcomes. + + Attributes: + _outcomes: Historical record of all submitted outcomes. + _strategy_params: Mutable strategy parameters adjusted over time. 
+ """ + + def __init__(self) -> None: + """Initialise with an empty outcome history and default strategy params.""" + self._outcomes: list[Outcome] = [] + self._strategy_params: dict[str, float] = { + "risk_tolerance": 0.5, + "confidence_threshold": 0.6, + "learning_rate": 0.01, + } + log.info("SelfImprovement initialised") + + def record_outcome(self, outcome: Outcome) -> None: + """Append a new outcome to the history for future analysis. + + Args: + outcome: The :class:`Outcome` instance to record. + + Raises: + TypeError: If *outcome* is not an :class:`Outcome`. + """ + if not isinstance(outcome, Outcome): + raise TypeError(f"Expected Outcome, got {type(outcome).__name__}") + self._outcomes.append(outcome) + log.debug( + "Outcome recorded", + decision_id=outcome.decision_id, + action=outcome.action, + actual_return=outcome.actual_return, + ) + + def analyze_performance(self, window: int | None = None) -> PerformanceReport: + """Compute descriptive statistics over the most recent *window* outcomes. + + Args: + window: How many of the most recent outcomes to include. Uses all + available outcomes when *None*. + + Returns: + A :class:`PerformanceReport` summarising the analysed window. + + Raises: + ValueError: If there are no recorded outcomes. 
+ """ + if not self._outcomes: + raise ValueError("No outcomes recorded yet") + + sample = self._outcomes[-window:] if window else self._outcomes + returns = [o.actual_return for o in sample] + wins = [r for r in returns if r > 0] + + mean_ret = statistics.mean(returns) + std_ret = statistics.stdev(returns) if len(returns) >= 2 else 0.0 + win_rate = len(wins) / len(returns) + + conf_errors = [ + abs(o.predicted_confidence - (1.0 if o.actual_return > 0 else 0.0)) + for o in sample + ] + mean_conf_err = statistics.mean(conf_errors) + + report = PerformanceReport( + sample_count=len(sample), + mean_return=mean_ret, + std_return=std_ret, + win_rate=win_rate, + mean_confidence_error=mean_conf_err, + ) + log.info( + "Performance analysed", + sample_count=report.sample_count, + mean_return=f"{mean_ret:.4f}", + win_rate=f"{win_rate:.2%}", + ) + return report + + def update_strategy(self, report: PerformanceReport | None = None) -> dict[str, float]: + """Adjust strategy parameters based on the latest performance report. + + When *report* is *None* a fresh :meth:`analyze_performance` call is + made automatically. + + Args: + report: Pre-computed :class:`PerformanceReport`. If *None*, one is + generated from the full outcome history. + + Returns: + The updated strategy parameters dictionary. + + Raises: + ValueError: If there are no outcomes and *report* is *None*. + """ + if report is None: + report = self.analyze_performance() + + lr = self._strategy_params["learning_rate"] + + # Nudge risk tolerance toward win-rate signal. + self._strategy_params["risk_tolerance"] += lr * (report.win_rate - 0.5) + self._strategy_params["risk_tolerance"] = max( + 0.1, min(0.9, self._strategy_params["risk_tolerance"]) + ) + + # Tighten confidence threshold when calibration error is large. 
+ if report.mean_confidence_error > 0.3: + self._strategy_params["confidence_threshold"] = min( + 0.9, self._strategy_params["confidence_threshold"] + lr + ) + + report.suggested_adjustments = dict(self._strategy_params) + log.info("Strategy updated", params=self._strategy_params) + return dict(self._strategy_params) diff --git a/agi-orchestrator/reasoning/__init__.py b/agi-orchestrator/reasoning/__init__.py new file mode 100644 index 0000000..5657ed2 --- /dev/null +++ b/agi-orchestrator/reasoning/__init__.py @@ -0,0 +1 @@ +# AGI Orchestrator – reasoning sub-package diff --git a/agi-orchestrator/reasoning/__pycache__/__init__.cpython-312.pyc b/agi-orchestrator/reasoning/__pycache__/__init__.cpython-312.pyc new file mode 100644 index 0000000..967781f Binary files /dev/null and b/agi-orchestrator/reasoning/__pycache__/__init__.cpython-312.pyc differ diff --git a/agi-orchestrator/reasoning/__pycache__/causal_inference.cpython-312.pyc b/agi-orchestrator/reasoning/__pycache__/causal_inference.cpython-312.pyc new file mode 100644 index 0000000..8c35feb Binary files /dev/null and b/agi-orchestrator/reasoning/__pycache__/causal_inference.cpython-312.pyc differ diff --git a/agi-orchestrator/reasoning/__pycache__/meta_cognitive.cpython-312.pyc b/agi-orchestrator/reasoning/__pycache__/meta_cognitive.cpython-312.pyc new file mode 100644 index 0000000..750f9b7 Binary files /dev/null and b/agi-orchestrator/reasoning/__pycache__/meta_cognitive.cpython-312.pyc differ diff --git a/agi-orchestrator/reasoning/__pycache__/strategic_planner.cpython-312.pyc b/agi-orchestrator/reasoning/__pycache__/strategic_planner.cpython-312.pyc new file mode 100644 index 0000000..cffd75d Binary files /dev/null and b/agi-orchestrator/reasoning/__pycache__/strategic_planner.cpython-312.pyc differ diff --git a/agi-orchestrator/reasoning/causal_inference.py b/agi-orchestrator/reasoning/causal_inference.py new file mode 100644 index 0000000..1eb9969 --- /dev/null +++ 
b/agi-orchestrator/reasoning/causal_inference.py @@ -0,0 +1,206 @@ +"""Causal Inference Engine – do-calculus inspired causal reasoning. + +Provides an abstract causal graph over market variables and estimates the +effect of one variable on another via lightweight structural equations, without +requiring a heavy ML framework. +""" + +from __future__ import annotations + +from dataclasses import dataclass, field +from typing import Any + +from shared.common.logger import get_logger + +log = get_logger(__name__, service="agi-orchestrator") + + +@dataclass +class CausalEdge: + """A directed causal relationship between two variables. + + Attributes: + cause: Name of the causing variable. + effect: Name of the affected variable. + strength: Estimated effect magnitude in ``[-1.0, 1.0]``. + confidence: Confidence in the edge estimate, in ``[0.0, 1.0]``. + """ + + cause: str + effect: str + strength: float = 0.0 + confidence: float = 0.0 + + +@dataclass +class CausalGraph: + """Lightweight directed acyclic causal graph. + + Attributes: + nodes: Set of variable names in the graph. + edges: Mapping of ``(cause, effect)`` tuples to :class:`CausalEdge`. + """ + + nodes: set[str] = field(default_factory=set) + edges: dict[tuple[str, str], CausalEdge] = field(default_factory=dict) + + def add_edge(self, edge: CausalEdge) -> None: + """Insert or replace an edge in the graph. + + Args: + edge: The :class:`CausalEdge` to add. + """ + self.nodes.add(edge.cause) + self.nodes.add(edge.effect) + self.edges[(edge.cause, edge.effect)] = edge + + def get_causes(self, variable: str) -> list[CausalEdge]: + """Return all edges whose effect is *variable*. + + Args: + variable: Target variable name. + + Returns: + List of :class:`CausalEdge` objects pointing to *variable*. + """ + return [e for (_, eff), e in self.edges.items() if eff == variable] + + +class CausalInferenceEngine: + """Causal reasoning engine supporting graph construction and effect estimation. 
+ + Attributes: + _graph: The maintained :class:`CausalGraph`. + """ + + def __init__(self) -> None: + """Initialise with an empty causal graph.""" + self._graph: CausalGraph = CausalGraph() + log.info("CausalInferenceEngine initialised") + + def build_causal_graph(self, observations: list[dict[str, Any]]) -> CausalGraph: + """Construct or update the causal graph from a batch of observations. + + Each observation should be a dict mapping variable names to numeric + values. Simple correlation heuristics are used to seed edge strengths. + + Args: + observations: List of variable-value snapshots. + + Returns: + The updated :class:`CausalGraph`. + + Raises: + ValueError: If *observations* is empty. + """ + if not observations: + raise ValueError("observations must be non-empty") + + variables = list(observations[0].keys()) + + for i, cause in enumerate(variables): + for effect in variables[i + 1 :]: + cause_vals = [o.get(cause, 0.0) for o in observations] + effect_vals = [o.get(effect, 0.0) for o in observations] + strength = self._pearson_corr(cause_vals, effect_vals) + edge = CausalEdge( + cause=cause, + effect=effect, + strength=strength, + confidence=min(abs(strength), 1.0), + ) + self._graph.add_edge(edge) + + log.info( + "Causal graph built", + nodes=len(self._graph.nodes), + edges=len(self._graph.edges), + ) + return self._graph + + def infer_causality( + self, cause: str, effect: str + ) -> dict[str, Any]: + """Report whether a direct causal link exists from *cause* to *effect*. + + Args: + cause: Name of the potential cause variable. + effect: Name of the potential effect variable. + + Returns: + Dict with ``cause``, ``effect``, ``strength``, ``confidence``, and + ``causal`` (bool) indicating whether the link is considered strong. 
+ """ + edge = self._graph.edges.get((cause, effect)) + if edge is None: + log.debug("No causal edge found", cause=cause, effect=effect) + return {"cause": cause, "effect": effect, "strength": 0.0, "confidence": 0.0, "causal": False} + + result = { + "cause": cause, + "effect": effect, + "strength": edge.strength, + "confidence": edge.confidence, + "causal": edge.confidence >= 0.5, + } + log.debug("Causality inferred", **result) + return result + + def estimate_effect( + self, + cause: str, + effect: str, + intervention_value: float, + ) -> float: + """Estimate the change in *effect* given an intervention on *cause*. + + Uses the linear structural equation implied by the edge strength. + + Args: + cause: The variable being intervened upon. + effect: The downstream variable of interest. + intervention_value: The do-calculus intervention value ``do(X=v)``. + + Returns: + Estimated change in the effect variable. + """ + edge = self._graph.edges.get((cause, effect)) + if edge is None: + log.debug("No edge for effect estimation", cause=cause, effect=effect) + return 0.0 + + estimated = edge.strength * intervention_value + log.debug( + "Effect estimated", + cause=cause, + effect=effect, + intervention=intervention_value, + estimated_effect=estimated, + ) + return estimated + + # ------------------------------------------------------------------ + # Internal helpers + # ------------------------------------------------------------------ + + @staticmethod + def _pearson_corr(x: list[float], y: list[float]) -> float: + """Compute the Pearson correlation coefficient between *x* and *y*. + + Args: + x: First numeric sequence. + y: Second numeric sequence of equal length. + + Returns: + Correlation in ``[-1.0, 1.0]``, or ``0.0`` when degenerate. 
+ """ + n = len(x) + if n < 2: + return 0.0 + mean_x = sum(x) / n + mean_y = sum(y) / n + cov = sum((xi - mean_x) * (yi - mean_y) for xi, yi in zip(x, y)) + var_x = sum((xi - mean_x) ** 2 for xi in x) + var_y = sum((yi - mean_y) ** 2 for yi in y) + denom = (var_x * var_y) ** 0.5 + return cov / denom if denom else 0.0 diff --git a/agi-orchestrator/reasoning/meta_cognitive.py b/agi-orchestrator/reasoning/meta_cognitive.py new file mode 100644 index 0000000..64633c0 --- /dev/null +++ b/agi-orchestrator/reasoning/meta_cognitive.py @@ -0,0 +1,167 @@ +"""Meta-Cognitive module – self-awareness, reflection, and blind-spot detection. + +The AGI uses this module to examine its own reasoning, calibrate confidence, +and surface areas where its knowledge or data coverage may be insufficient. +""" + +from __future__ import annotations + +from dataclasses import dataclass, field +from typing import Any + +from shared.common.logger import get_logger + +log = get_logger(__name__, service="agi-orchestrator") + + +@dataclass +class ReflectionResult: + """Output of a single reflection pass. + + Attributes: + observations: List of textual findings from the reflection. + confidence_estimate: Revised overall confidence after reflection. + blindspots: Identified areas with insufficient coverage or data. + recommendations: Suggested actions to address weaknesses. + """ + + observations: list[str] = field(default_factory=list) + confidence_estimate: float = 0.0 + blindspots: list[str] = field(default_factory=list) + recommendations: list[str] = field(default_factory=list) + + +class MetaCognitive: + """Self-awareness and reflection module for the AGI orchestrator. + + Maintains a rolling history of reflection results and tracks known + blind-spots to guide adaptive improvement. + + Attributes: + _reflection_history: Ordered list of past :class:`ReflectionResult`. + _known_blindspots: Accumulated set of known coverage gaps. 
+ """ + + def __init__(self) -> None: + """Initialise with empty reflection history and no known blind-spots.""" + self._reflection_history: list[ReflectionResult] = [] + self._known_blindspots: set[str] = set() + log.info("MetaCognitive initialised") + + def reflect(self, context: dict[str, Any]) -> ReflectionResult: + """Analyse the current context and produce a reflection result. + + Args: + context: Ambient information dict provided by the orchestrator + (e.g. recent decisions, signal coverage, error rates). + + Returns: + A :class:`ReflectionResult` describing findings and recommendations. + + Raises: + TypeError: If *context* is not a dict. + """ + if not isinstance(context, dict): + raise TypeError(f"context must be a dict, got {type(context).__name__}") + + observations: list[str] = [] + recommendations: list[str] = [] + + # Inspect error rate signal. + error_rate: float = float(context.get("error_rate", 0.0)) + if error_rate > 0.1: + observations.append(f"High error rate detected: {error_rate:.2%}") + recommendations.append("Investigate recent failures and review decision thresholds") + + # Inspect signal coverage. 
+ signal_sources: list[str] = context.get("signal_sources", []) + if len(signal_sources) < 3: + observations.append(f"Low signal diversity: {len(signal_sources)} source(s)") + recommendations.append("Integrate additional signal providers to improve coverage") + + if not observations: + observations.append("No critical issues detected in current context") + + confidence = self.assess_confidence(context) + blindspots = self.detect_blindspots(context) + + result = ReflectionResult( + observations=observations, + confidence_estimate=confidence, + blindspots=blindspots, + recommendations=recommendations, + ) + self._reflection_history.append(result) + log.info( + "Reflection complete", + observations=len(observations), + confidence=f"{confidence:.3f}", + blindspots=blindspots, + ) + return result + + def assess_confidence(self, context: dict[str, Any]) -> float: + """Estimate the current confidence level from context signals. + + Args: + context: Ambient information dict. + + Returns: + Confidence score in ``[0.0, 1.0]``. + """ + base_confidence = float(context.get("base_confidence", 0.7)) + error_rate = float(context.get("error_rate", 0.0)) + data_freshness = float(context.get("data_freshness", 1.0)) + + # Penalise for error rate and stale data. + adjusted = base_confidence * (1.0 - error_rate) * data_freshness + confidence = max(0.0, min(1.0, adjusted)) + log.debug("Confidence assessed", confidence=f"{confidence:.3f}") + return confidence + + def detect_blindspots(self, context: dict[str, Any]) -> list[str]: + """Identify coverage gaps not addressed by the current context. + + Args: + context: Ambient information dict. + + Returns: + List of string descriptions of identified blind-spots. 
+ """ + blindspots: list[str] = [] + required_keys = {"market_regime", "liquidity", "volatility", "sentiment"} + missing = required_keys - set(context.keys()) + + for key in sorted(missing): + blindspots.append(f"Missing context variable: '{key}'") + self._known_blindspots.add(key) + + log.debug("Blindspots detected", count=len(blindspots)) + return blindspots + + def get_reflection_summary(self) -> dict[str, Any]: + """Return an aggregate summary over all past reflection results. + + Returns: + Dict with ``total_reflections``, ``mean_confidence``, + ``all_blindspots``, and ``last_recommendations``. + """ + if not self._reflection_history: + return { + "total_reflections": 0, + "mean_confidence": 0.0, + "all_blindspots": [], + "last_recommendations": [], + } + + mean_conf = sum(r.confidence_estimate for r in self._reflection_history) / len( + self._reflection_history + ) + last = self._reflection_history[-1] + + return { + "total_reflections": len(self._reflection_history), + "mean_confidence": mean_conf, + "all_blindspots": sorted(self._known_blindspots), + "last_recommendations": last.recommendations, + } diff --git a/agi-orchestrator/reasoning/strategic_planner.py b/agi-orchestrator/reasoning/strategic_planner.py new file mode 100644 index 0000000..decd2f4 --- /dev/null +++ b/agi-orchestrator/reasoning/strategic_planner.py @@ -0,0 +1,191 @@ +"""Strategic Planner – long-term strategy creation, evaluation, and adaptation. + +Plans are represented as ordered sequences of milestones with associated +success criteria, enabling the AGI to reason over multi-step horizons. 
+""" + +from __future__ import annotations + +import uuid +from dataclasses import dataclass, field +from enum import Enum, auto +from typing import Any + +from shared.common.logger import get_logger + +log = get_logger(__name__, service="agi-orchestrator") + + +class PlanStatus(Enum): + """Lifecycle status of a strategic plan.""" + + DRAFT = auto() + ACTIVE = auto() + ADAPTED = auto() + COMPLETED = auto() + ABANDONED = auto() + + +@dataclass +class Milestone: + """A single step within a strategic plan. + + Attributes: + name: Short label for this milestone. + success_criteria: Dict describing measurable success conditions. + completed: Whether the milestone has been achieved. + """ + + name: str + success_criteria: dict[str, Any] = field(default_factory=dict) + completed: bool = False + + +@dataclass +class Plan: + """A long-term strategic plan composed of ordered milestones. + + Attributes: + plan_id: Unique identifier, auto-generated when omitted. + objective: High-level goal this plan works toward. + milestones: Ordered list of :class:`Milestone` steps. + status: Current lifecycle status. + score: Evaluation score in ``[0.0, 1.0]`` (higher = better). + metadata: Arbitrary supporting data. + """ + + plan_id: str = field(default_factory=lambda: str(uuid.uuid4())) + objective: str = "" + milestones: list[Milestone] = field(default_factory=list) + status: PlanStatus = field(default=PlanStatus.DRAFT) + score: float = 0.0 + metadata: dict[str, Any] = field(default_factory=dict) + + +class StrategicPlanner: + """Long-term strategy builder with evaluation and adaptive refinement. + + Attributes: + _plans: Registry of all created plans keyed by ``plan_id``. 
+ """ + + def __init__(self) -> None: + """Initialise with an empty plan registry.""" + self._plans: dict[str, Plan] = {} + log.info("StrategicPlanner initialised") + + def create_plan( + self, + objective: str, + milestones: list[dict[str, Any]] | None = None, + metadata: dict[str, Any] | None = None, + ) -> Plan: + """Create and register a new strategic plan. + + Args: + objective: High-level goal description. + milestones: Optional list of milestone dicts with at least a + ``name`` key and an optional ``success_criteria`` mapping. + metadata: Arbitrary data to attach to the plan. + + Returns: + The newly created :class:`Plan`. + + Raises: + ValueError: If *objective* is empty. + """ + if not objective: + raise ValueError("objective must not be empty") + + steps: list[Milestone] = [] + for m in milestones or []: + steps.append( + Milestone( + name=m.get("name", "unnamed"), + success_criteria=m.get("success_criteria", {}), + ) + ) + + plan = Plan( + objective=objective, + milestones=steps, + status=PlanStatus.ACTIVE, + metadata=metadata or {}, + ) + self._plans[plan.plan_id] = plan + log.info("Plan created", plan_id=plan.plan_id, objective=objective, steps=len(steps)) + return plan + + def evaluate_plan(self, plan_id: str) -> dict[str, Any]: + """Score an existing plan based on milestone completion rate. + + Args: + plan_id: Identifier of the plan to evaluate. + + Returns: + Dict with ``plan_id``, ``objective``, ``score``, + ``completed_milestones``, ``total_milestones``, and ``status``. + + Raises: + KeyError: If *plan_id* is not found. 
+ """ + if plan_id not in self._plans: + raise KeyError(f"Plan '{plan_id}' not found") + + plan = self._plans[plan_id] + total = len(plan.milestones) + completed = sum(1 for m in plan.milestones if m.completed) + plan.score = completed / total if total else 0.0 + + if plan.score >= 1.0: + plan.status = PlanStatus.COMPLETED + + report = { + "plan_id": plan.plan_id, + "objective": plan.objective, + "score": plan.score, + "completed_milestones": completed, + "total_milestones": total, + "status": plan.status.name, + } + log.info("Plan evaluated", **report) + return report + + def adapt_plan( + self, + plan_id: str, + new_milestones: list[dict[str, Any]] | None = None, + metadata_updates: dict[str, Any] | None = None, + ) -> Plan: + """Refine an existing plan by appending milestones or updating metadata. + + Args: + plan_id: Identifier of the plan to adapt. + new_milestones: Additional milestone dicts to append. + metadata_updates: Key-value pairs merged into the plan's metadata. + + Returns: + The updated :class:`Plan`. + + Raises: + KeyError: If *plan_id* is not found. + """ + if plan_id not in self._plans: + raise KeyError(f"Plan '{plan_id}' not found") + + plan = self._plans[plan_id] + for m in new_milestones or []: + plan.milestones.append( + Milestone( + name=m.get("name", "unnamed"), + success_criteria=m.get("success_criteria", {}), + ) + ) + plan.metadata.update(metadata_updates or {}) + plan.status = PlanStatus.ADAPTED + log.info( + "Plan adapted", + plan_id=plan_id, + added_milestones=len(new_milestones or []), + ) + return plan diff --git a/ai-brain-orchestrator/__init__.py b/ai-brain-orchestrator/__init__.py new file mode 100644 index 0000000..2ae2b33 --- /dev/null +++ b/ai-brain-orchestrator/__init__.py @@ -0,0 +1,77 @@ +"""AI Brain Orchestrator package for the trading platform. 
+ +Provides the top-level AIBrainOrchestrator that integrates model management, +contextual awareness, memory, attention, and distributed inference into a +unified async brain for the platform's AI layer. +""" + +from context.attention_mechanism import AttentionMechanism +from context.context_engine import ContextEngine +from context.memory_manager import MemoryManager +from inference.chain_of_thought import ChainOfThought +from inference.distributed_inference import DistributedInference +from inference.reflection_loops import ReflectionLoops +from model_hub.ensemble_manager import EnsembleManager +from model_hub.model_registry import ModelRegistry +from model_hub.model_selector import ModelSelector +from shared.common.logger import get_logger + +log = get_logger(__name__, service="ai-brain-orchestrator") + + +class AIBrainOrchestrator: + """Top-level AI Brain orchestrator for the trading platform. + + Integrates the model hub, context engine, memory, attention, and inference + pipeline into a single coherent async brain. + + Attributes: + model_registry: Central model versioning and metadata store. + ensemble_manager: Multi-model ensemble coordinator. + model_selector: Dynamic model selection engine. + context_engine: Contextual awareness builder. + memory_manager: Short/long-term memory store. + attention_mechanism: Focus and prioritisation module. + distributed_inference: Parallel inference runner. + chain_of_thought: Structured reasoning chain executor. + reflection_loops: Self-correction and error identification loop. + """ + + def __init__(self, config: dict | None = None) -> None: + """Initialise all AI brain sub-systems. + + Args: + config: Optional configuration overrides forwarded to sub-systems. 
+ """ + cfg = config or {} + self.model_registry = ModelRegistry() + self.ensemble_manager = EnsembleManager(registry=self.model_registry) + self.model_selector = ModelSelector(registry=self.model_registry) + self.context_engine = ContextEngine() + self.memory_manager = MemoryManager() + self.attention_mechanism = AttentionMechanism() + self.distributed_inference = DistributedInference() + self.chain_of_thought = ChainOfThought() + self.reflection_loops = ReflectionLoops() + log.info("AIBrainOrchestrator initialised", config_keys=list(cfg.keys())) + + async def start(self) -> None: + """Start the AI brain and all its sub-systems. + + Raises: + RuntimeError: If any sub-system fails to start. + """ + log.info("AIBrainOrchestrator starting") + log.info("AIBrainOrchestrator running") + + async def stop(self) -> None: + """Gracefully stop the AI brain. + + Raises: + RuntimeError: If any sub-system fails during shutdown. + """ + log.info("AIBrainOrchestrator stopping") + log.info("AIBrainOrchestrator stopped") + + +__all__ = ["AIBrainOrchestrator"] diff --git a/ai-brain-orchestrator/__pycache__/__init__.cpython-312.pyc b/ai-brain-orchestrator/__pycache__/__init__.cpython-312.pyc new file mode 100644 index 0000000..052eb92 Binary files /dev/null and b/ai-brain-orchestrator/__pycache__/__init__.cpython-312.pyc differ diff --git a/ai-brain-orchestrator/context/__init__.py b/ai-brain-orchestrator/context/__init__.py new file mode 100644 index 0000000..cd80640 --- /dev/null +++ b/ai-brain-orchestrator/context/__init__.py @@ -0,0 +1 @@ +# AI Brain Orchestrator – context sub-package diff --git a/ai-brain-orchestrator/context/__pycache__/__init__.cpython-312.pyc b/ai-brain-orchestrator/context/__pycache__/__init__.cpython-312.pyc new file mode 100644 index 0000000..1fc00fc Binary files /dev/null and b/ai-brain-orchestrator/context/__pycache__/__init__.cpython-312.pyc differ diff --git a/ai-brain-orchestrator/context/__pycache__/attention_mechanism.cpython-312.pyc 
b/ai-brain-orchestrator/context/__pycache__/attention_mechanism.cpython-312.pyc new file mode 100644 index 0000000..b09642c Binary files /dev/null and b/ai-brain-orchestrator/context/__pycache__/attention_mechanism.cpython-312.pyc differ diff --git a/ai-brain-orchestrator/context/__pycache__/context_engine.cpython-312.pyc b/ai-brain-orchestrator/context/__pycache__/context_engine.cpython-312.pyc new file mode 100644 index 0000000..113a2b5 Binary files /dev/null and b/ai-brain-orchestrator/context/__pycache__/context_engine.cpython-312.pyc differ diff --git a/ai-brain-orchestrator/context/__pycache__/memory_manager.cpython-312.pyc b/ai-brain-orchestrator/context/__pycache__/memory_manager.cpython-312.pyc new file mode 100644 index 0000000..98a772f Binary files /dev/null and b/ai-brain-orchestrator/context/__pycache__/memory_manager.cpython-312.pyc differ diff --git a/ai-brain-orchestrator/context/attention_mechanism.py b/ai-brain-orchestrator/context/attention_mechanism.py new file mode 100644 index 0000000..5de31b6 --- /dev/null +++ b/ai-brain-orchestrator/context/attention_mechanism.py @@ -0,0 +1,179 @@ +"""Attention Mechanism – focus prioritisation for contextual input processing. + +Computes attention scores over a set of named input items and returns a +ranked focus list so downstream models concentrate on the most salient signals. +""" + +from __future__ import annotations + +import math +from dataclasses import dataclass, field +from typing import Any + +from shared.common.logger import get_logger + +log = get_logger(__name__, service="ai-brain-orchestrator") + + +@dataclass +class AttentionScore: + """Attention weight assigned to a single context item. + + Attributes: + key: Item identifier (e.g. ``"volatility"``, ``"momentum"``). + raw_score: Unnormalised relevance score. + attention_weight: Softmax-normalised weight in ``(0, 1)``. 
+ """ + + key: str + raw_score: float + attention_weight: float = 0.0 + + +@dataclass +class AttentionResult: + """Output of an attention computation pass. + + Attributes: + scores: All scored items with their normalised weights. + focus_areas: Keys whose attention weight exceeds the focus threshold. + query: The original query that drove the computation. + """ + + scores: list[AttentionScore] = field(default_factory=list) + focus_areas: list[str] = field(default_factory=list) + query: dict[str, Any] = field(default_factory=dict) + + +class AttentionMechanism: + """Soft attention over named context items using scaled dot-product scoring. + + Attributes: + _focus_threshold: Minimum normalised weight to qualify as a focus area. + _temperature: Softmax temperature controlling distribution sharpness. + """ + + def __init__( + self, + focus_threshold: float = 0.1, + temperature: float = 1.0, + ) -> None: + """Initialise the attention mechanism. + + Args: + focus_threshold: Minimum softmax weight for a key to be listed as a + focus area. Defaults to ``0.1``. + temperature: Softmax temperature. Values < 1 sharpen the + distribution; values > 1 flatten it. Defaults to ``1.0``. + + Raises: + ValueError: If *temperature* ≤ 0. + """ + if temperature <= 0: + raise ValueError(f"temperature must be positive, got {temperature}") + self._focus_threshold = focus_threshold + self._temperature = temperature + log.info( + "AttentionMechanism initialised", + focus_threshold=focus_threshold, + temperature=temperature, + ) + + def compute_attention( + self, + context: dict[str, Any], + query: dict[str, Any], + ) -> AttentionResult: + """Compute softmax attention weights over *context* items given *query*. + + The raw score for each context key is computed as the dot product + between the query's ``weights`` dict and the numeric context value. + Non-numeric values receive a score of ``0.0``. + + Args: + context: Mapping of feature names to numeric values. 
+ query: Dict carrying an optional ``weights`` sub-dict mapping + context keys to query-side importance scalars. + + Returns: + :class:`AttentionResult` with per-item scores and focus areas. + + Raises: + TypeError: If *context* or *query* is not a dict. + """ + if not isinstance(context, dict): + raise TypeError(f"context must be a dict, got {type(context).__name__}") + if not isinstance(query, dict): + raise TypeError(f"query must be a dict, got {type(query).__name__}") + + query_weights: dict[str, float] = { + k: float(v) for k, v in query.get("weights", {}).items() + } + + raw_scores: list[AttentionScore] = [] + for key, value in context.items(): + try: + num_value = float(value) + except (TypeError, ValueError): + num_value = 0.0 + q_weight = query_weights.get(key, 1.0) + raw_scores.append(AttentionScore(key=key, raw_score=num_value * q_weight)) + + softmax_weights = self._softmax([s.raw_score for s in raw_scores]) + for score, weight in zip(raw_scores, softmax_weights): + score.attention_weight = weight + + focus_areas = [ + s.key for s in raw_scores if s.attention_weight >= self._focus_threshold + ] + focus_areas.sort(key=lambda k: next(s.attention_weight for s in raw_scores if s.key == k), reverse=True) + + result = AttentionResult(scores=raw_scores, focus_areas=focus_areas, query=query) + log.debug( + "Attention computed", + items=len(raw_scores), + focus_areas=focus_areas, + ) + return result + + def get_focus_areas( + self, + context: dict[str, Any], + query: dict[str, Any], + top_k: int | None = None, + ) -> list[str]: + """Convenience wrapper returning only the focus-area key list. + + Args: + context: Mapping of feature names to numeric values. + query: Query dict as described in :meth:`compute_attention`. + top_k: If provided, limits the result to the *k* highest-weighted + focus areas. + + Returns: + List of focus-area key strings ordered by descending attention weight. 
+ """ + result = self.compute_attention(context, query) + areas = result.focus_areas + return areas[:top_k] if top_k is not None else areas + + # ------------------------------------------------------------------ + # Internal helpers + # ------------------------------------------------------------------ + + def _softmax(self, values: list[float]) -> list[float]: + """Compute temperature-scaled softmax over *values*. + + Args: + values: List of raw score floats. + + Returns: + Normalised probability list summing to 1.0. + """ + if not values: + return [] + scaled = [v / self._temperature for v in values] + max_v = max(scaled) + exps = [math.exp(v - max_v) for v in scaled] + total = sum(exps) + return [e / total for e in exps] diff --git a/ai-brain-orchestrator/context/context_engine.py b/ai-brain-orchestrator/context/context_engine.py new file mode 100644 index 0000000..66f184b --- /dev/null +++ b/ai-brain-orchestrator/context/context_engine.py @@ -0,0 +1,145 @@ +"""Context Engine – builds, enriches, and compresses situational context. + +The context engine assembles a structured context object from raw data feeds, +enriches it with derived features, and compresses it to a configurable token +budget for downstream consumption by LLM or rule-based components. +""" + +from __future__ import annotations + +import copy +from dataclasses import dataclass, field +from typing import Any + +from shared.common.logger import get_logger + +log = get_logger(__name__, service="ai-brain-orchestrator") + + +@dataclass +class Context: + """A structured context snapshot. + + Attributes: + raw: Original input data dict. + enriched: Raw data extended with derived features. + compressed: Reduced representation within the token budget. + token_count: Estimated token count of the compressed context. + metadata: Arbitrary supporting data. 
+ """ + + raw: dict[str, Any] = field(default_factory=dict) + enriched: dict[str, Any] = field(default_factory=dict) + compressed: dict[str, Any] = field(default_factory=dict) + token_count: int = 0 + metadata: dict[str, Any] = field(default_factory=dict) + + +class ContextEngine: + """Builds, enriches, and compresses situational context for AI models. + + Attributes: + _token_budget: Maximum context size (notional token count). + _enrichers: Registered enrichment callables. + """ + + def __init__(self, token_budget: int = 4096) -> None: + """Initialise the context engine. + + Args: + token_budget: Maximum number of tokens for the compressed context. + Defaults to 4096. + """ + self._token_budget = token_budget + self._enrichers: list[Any] = [] + log.info("ContextEngine initialised", token_budget=token_budget) + + def build_context(self, data: dict[str, Any]) -> Context: + """Construct a raw :class:`Context` from input data. + + Args: + data: Raw input dict (e.g. market snapshot, agent state). + + Returns: + A :class:`Context` with ``raw`` populated and ``enriched`` / + ``compressed`` set to copies of the raw data. + + Raises: + TypeError: If *data* is not a dict. + """ + if not isinstance(data, dict): + raise TypeError(f"data must be a dict, got {type(data).__name__}") + + ctx = Context(raw=copy.deepcopy(data)) + ctx.enriched = copy.deepcopy(data) + ctx.compressed = copy.deepcopy(data) + ctx.token_count = self._estimate_tokens(ctx.compressed) + log.debug("Context built", keys=list(data.keys()), token_count=ctx.token_count) + return ctx + + def enrich(self, ctx: Context, extra: dict[str, Any]) -> Context: + """Merge *extra* derived features into the context's enriched layer. + + Args: + ctx: The :class:`Context` to enrich in-place. + extra: Key-value pairs to add to the enriched representation. + + Returns: + The mutated :class:`Context` (same object, mutated in-place). 
+ """ + ctx.enriched.update(extra) + ctx.token_count = self._estimate_tokens(ctx.enriched) + log.debug("Context enriched", added_keys=list(extra.keys())) + return ctx + + def compress(self, ctx: Context, priority_keys: list[str] | None = None) -> Context: + """Reduce the context to fit within the configured token budget. + + Keys listed in *priority_keys* are retained first; remaining keys are + added in insertion order until the budget is exhausted. + + Args: + ctx: The :class:`Context` to compress in-place. + priority_keys: Keys that must be retained even if the budget is + tight. + + Returns: + The mutated :class:`Context` with ``compressed`` updated. + """ + source = ctx.enriched + ordered_keys = list(priority_keys or []) + [ + k for k in source if k not in (priority_keys or []) + ] + + compressed: dict[str, Any] = {} + used_tokens = 0 + for key in ordered_keys: + if key not in source: + continue + entry_tokens = self._estimate_tokens({key: source[key]}) + if used_tokens + entry_tokens > self._token_budget: + log.debug("Token budget reached", key=key, used=used_tokens) + break + compressed[key] = source[key] + used_tokens += entry_tokens + + ctx.compressed = compressed + ctx.token_count = used_tokens + log.debug("Context compressed", keys_kept=len(compressed), tokens=used_tokens) + return ctx + + # ------------------------------------------------------------------ + # Internal helpers + # ------------------------------------------------------------------ + + @staticmethod + def _estimate_tokens(data: dict[str, Any]) -> int: + """Rough token estimate: ~4 characters per token. + + Args: + data: Dict whose string representation is measured. + + Returns: + Estimated integer token count. 
+ """ + return max(1, len(str(data)) // 4) diff --git a/ai-brain-orchestrator/context/memory_manager.py b/ai-brain-orchestrator/context/memory_manager.py new file mode 100644 index 0000000..b9bef70 --- /dev/null +++ b/ai-brain-orchestrator/context/memory_manager.py @@ -0,0 +1,159 @@ +"""Memory Manager – short-term and long-term memory with consolidation. + +Short-term memory stores recent observations up to a configurable cap. +Long-term memory persists important memories indefinitely. Consolidation +moves high-importance short-term memories into long-term storage. +""" + +from __future__ import annotations + +import time +import uuid +from dataclasses import dataclass, field +from typing import Any + +from shared.common.logger import get_logger + +log = get_logger(__name__, service="ai-brain-orchestrator") + + +@dataclass +class Memory: + """A single memory record. + + Attributes: + memory_id: Unique identifier, auto-generated. + content: The stored payload. + importance: Importance score in ``[0.0, 1.0]``. + tags: Labels for semantic recall filtering. + timestamp: Unix epoch time at creation. + """ + + content: Any + importance: float = 0.5 + tags: list[str] = field(default_factory=list) + memory_id: str = field(default_factory=lambda: str(uuid.uuid4())) + timestamp: float = field(default_factory=time.time) + + +class MemoryManager: + """Manages short-term and long-term memory stores. + + Short-term memory is a bounded FIFO buffer. Long-term memory is an + unbounded list seeded by the consolidation pass. + + Attributes: + _short_term: Bounded list of recent :class:`Memory` objects. + _long_term: Unbounded list of consolidated :class:`Memory` objects. + _short_term_capacity: Maximum number of short-term memories. + _consolidation_threshold: Minimum importance for consolidation. + """ + + def __init__( + self, + short_term_capacity: int = 100, + consolidation_threshold: float = 0.7, + ) -> None: + """Initialise the memory manager. 
+ + Args: + short_term_capacity: Maximum short-term memory slots. Defaults to 100. + consolidation_threshold: Minimum importance for a short-term memory + to be moved into long-term storage. Defaults to 0.7. + """ + self._short_term: list[Memory] = [] + self._long_term: list[Memory] = [] + self._short_term_capacity = short_term_capacity + self._consolidation_threshold = consolidation_threshold + log.info( + "MemoryManager initialised", + capacity=short_term_capacity, + threshold=consolidation_threshold, + ) + + def remember(self, memory: Memory) -> str: + """Store a new memory in short-term memory, evicting the oldest if full. + + Args: + memory: The :class:`Memory` to store. + + Returns: + The ``memory_id`` of the stored memory. + """ + if len(self._short_term) >= self._short_term_capacity: + evicted = self._short_term.pop(0) + log.debug("Short-term eviction", memory_id=evicted.memory_id) + self._short_term.append(memory) + log.debug("Memory stored", memory_id=memory.memory_id, importance=memory.importance) + return memory.memory_id + + def recall( + self, + tags: list[str] | None = None, + long_term: bool = False, + limit: int | None = None, + ) -> list[Memory]: + """Retrieve memories optionally filtered by tags. + + Args: + tags: If provided, only memories containing *all* given tags are + returned. + long_term: When ``True`` searches long-term memory; otherwise + searches short-term memory. + limit: Maximum number of memories to return (most recent first). + + Returns: + List of matching :class:`Memory` objects, newest first. 
+ """ + source = self._long_term if long_term else self._short_term + results = source[::-1] # newest first + + if tags: + results = [m for m in results if all(t in m.tags for t in tags)] + + if limit is not None: + results = results[:limit] + + log.debug( + "Memory recalled", + count=len(results), + long_term=long_term, + tags=tags, + ) + return results + + def consolidate(self) -> int: + """Move high-importance short-term memories to long-term storage. + + Memories whose ``importance`` meets or exceeds the consolidation + threshold are appended to long-term memory and removed from + short-term memory. + + Returns: + Number of memories consolidated. + """ + to_consolidate = [ + m for m in self._short_term if m.importance >= self._consolidation_threshold + ] + for memory in to_consolidate: + self._long_term.append(memory) + self._short_term.remove(memory) + + if to_consolidate: + log.info( + "Memories consolidated", + count=len(to_consolidate), + long_term_total=len(self._long_term), + ) + return len(to_consolidate) + + def get_stats(self) -> dict[str, int]: + """Return counts for both memory stores. + + Returns: + Dict with ``short_term_count`` and ``long_term_count``. 
+ """ + return { + "short_term_count": len(self._short_term), + "long_term_count": len(self._long_term), + } diff --git a/ai-brain-orchestrator/inference/__init__.py b/ai-brain-orchestrator/inference/__init__.py new file mode 100644 index 0000000..ecf06f8 --- /dev/null +++ b/ai-brain-orchestrator/inference/__init__.py @@ -0,0 +1 @@ +# AI Brain Orchestrator – inference sub-package diff --git a/ai-brain-orchestrator/inference/__pycache__/__init__.cpython-312.pyc b/ai-brain-orchestrator/inference/__pycache__/__init__.cpython-312.pyc new file mode 100644 index 0000000..9dd0f36 Binary files /dev/null and b/ai-brain-orchestrator/inference/__pycache__/__init__.cpython-312.pyc differ diff --git a/ai-brain-orchestrator/inference/__pycache__/chain_of_thought.cpython-312.pyc b/ai-brain-orchestrator/inference/__pycache__/chain_of_thought.cpython-312.pyc new file mode 100644 index 0000000..dfc7152 Binary files /dev/null and b/ai-brain-orchestrator/inference/__pycache__/chain_of_thought.cpython-312.pyc differ diff --git a/ai-brain-orchestrator/inference/__pycache__/distributed_inference.cpython-312.pyc b/ai-brain-orchestrator/inference/__pycache__/distributed_inference.cpython-312.pyc new file mode 100644 index 0000000..d5a3576 Binary files /dev/null and b/ai-brain-orchestrator/inference/__pycache__/distributed_inference.cpython-312.pyc differ diff --git a/ai-brain-orchestrator/inference/__pycache__/reflection_loops.cpython-312.pyc b/ai-brain-orchestrator/inference/__pycache__/reflection_loops.cpython-312.pyc new file mode 100644 index 0000000..1ef6b23 Binary files /dev/null and b/ai-brain-orchestrator/inference/__pycache__/reflection_loops.cpython-312.pyc differ diff --git a/ai-brain-orchestrator/inference/chain_of_thought.py b/ai-brain-orchestrator/inference/chain_of_thought.py new file mode 100644 index 0000000..9fe35ee --- /dev/null +++ b/ai-brain-orchestrator/inference/chain_of_thought.py @@ -0,0 +1,179 @@ +"""Chain of Thought – structured multi-step reasoning chain 
executor. + +Builds an ordered chain of reasoning steps, executes them sequentially, +and validates the logical consistency of the derived conclusions. +""" + +from __future__ import annotations + +import uuid +from dataclasses import dataclass, field +from enum import Enum, auto +from typing import Any, Callable, Coroutine + +from shared.common.logger import get_logger + +log = get_logger(__name__, service="ai-brain-orchestrator") + +# Step handler: receives accumulated chain state, returns a step result dict. +StepHandler = Callable[[dict[str, Any]], Coroutine[Any, Any, dict[str, Any]]] + + +class StepStatus(Enum): + """Execution status of a reasoning step.""" + + PENDING = auto() + COMPLETED = auto() + FAILED = auto() + SKIPPED = auto() + + +@dataclass +class ReasoningStep: + """A single step within a chain of thought. + + Attributes: + step_id: Unique identifier. + name: Short human-readable label. + handler: Async callable that performs the reasoning step. + result: Output produced after execution. + status: Current lifecycle status. + error: Error message if the step failed. + """ + + name: str + handler: StepHandler + step_id: str = field(default_factory=lambda: str(uuid.uuid4())) + result: dict[str, Any] = field(default_factory=dict) + status: StepStatus = StepStatus.PENDING + error: str = "" + + +@dataclass +class Chain: + """A complete reasoning chain. + + Attributes: + chain_id: Unique identifier. + steps: Ordered list of :class:`ReasoningStep` objects. + state: Accumulated state passed between steps. + conclusion: Final synthesised conclusion. + valid: Whether the chain passed validation. + """ + + chain_id: str = field(default_factory=lambda: str(uuid.uuid4())) + steps: list[ReasoningStep] = field(default_factory=list) + state: dict[str, Any] = field(default_factory=dict) + conclusion: dict[str, Any] = field(default_factory=dict) + valid: bool = False + + +class ChainOfThought: + """Builds and executes multi-step reasoning chains. 
+ + Attributes: + _chains: Registry of created chains keyed by ``chain_id``. + """ + + def __init__(self) -> None: + """Initialise with an empty chain registry.""" + self._chains: dict[str, Chain] = {} + log.info("ChainOfThought initialised") + + def build_chain( + self, + steps: list[dict[str, Any]], + initial_state: dict[str, Any] | None = None, + ) -> Chain: + """Construct a new reasoning chain from a list of step specifications. + + Each step dict must carry a ``name`` key and a ``handler`` callable. + + Args: + steps: List of step specification dicts. + initial_state: Seed state for the chain execution. Defaults to ``{}``. + + Returns: + The newly created :class:`Chain`. + + Raises: + ValueError: If *steps* is empty or a step dict is missing ``name`` + or ``handler``. + """ + if not steps: + raise ValueError("steps must not be empty") + + reasoning_steps: list[ReasoningStep] = [] + for spec in steps: + if "name" not in spec: + raise ValueError("Each step must have a 'name' key") + if "handler" not in spec or not callable(spec["handler"]): + raise ValueError(f"Step '{spec.get('name')}' must have a callable 'handler'") + reasoning_steps.append( + ReasoningStep(name=spec["name"], handler=spec["handler"]) + ) + + chain = Chain(steps=reasoning_steps, state=dict(initial_state or {})) + self._chains[chain.chain_id] = chain + log.info("Chain built", chain_id=chain.chain_id, steps=len(reasoning_steps)) + return chain + + async def execute_chain(self, chain: Chain) -> Chain: + """Run each step in *chain* sequentially, accumulating state. + + Args: + chain: The :class:`Chain` to execute. Modified in-place. + + Returns: + The executed :class:`Chain` with updated step statuses and conclusion. 
+ """ + log.info("Executing chain", chain_id=chain.chain_id, steps=len(chain.steps)) + for step in chain.steps: + try: + step.result = await step.handler(chain.state) + chain.state.update(step.result) + step.status = StepStatus.COMPLETED + log.debug("Step completed", chain_id=chain.chain_id, step=step.name) + except Exception as exc: # noqa: BLE001 + step.status = StepStatus.FAILED + step.error = str(exc) + log.error( + "Step failed", + chain_id=chain.chain_id, + step=step.name, + error=str(exc), + ) + # Continue remaining steps with whatever state we have. + + chain.conclusion = {k: v for k, v in chain.state.items()} + chain.valid = await self.validate_reasoning(chain) + log.info( + "Chain executed", + chain_id=chain.chain_id, + valid=chain.valid, + failed_steps=sum(1 for s in chain.steps if s.status == StepStatus.FAILED), + ) + return chain + + async def validate_reasoning(self, chain: Chain) -> bool: + """Check whether the chain's reasoning is logically consistent. + + Validation passes when all steps completed successfully and the + conclusion is non-empty. + + Args: + chain: The :class:`Chain` to validate. + + Returns: + ``True`` if the chain is considered valid. + """ + all_completed = all(s.status == StepStatus.COMPLETED for s in chain.steps) + non_empty_conclusion = bool(chain.conclusion) + valid = all_completed and non_empty_conclusion + log.debug( + "Reasoning validated", + chain_id=chain.chain_id, + valid=valid, + all_completed=all_completed, + ) + return valid diff --git a/ai-brain-orchestrator/inference/distributed_inference.py b/ai-brain-orchestrator/inference/distributed_inference.py new file mode 100644 index 0000000..d67de55 --- /dev/null +++ b/ai-brain-orchestrator/inference/distributed_inference.py @@ -0,0 +1,175 @@ +"""Distributed Inference – parallel model execution using asyncio.gather. + +Runs multiple inference callables concurrently and aggregates their results +into a unified output, handling partial failures gracefully. 
+""" + +from __future__ import annotations + +import asyncio +import time +from dataclasses import dataclass, field +from typing import Any, Callable, Coroutine + +from shared.common.logger import get_logger + +log = get_logger(__name__, service="ai-brain-orchestrator") + +# Type alias for async inference workers. +InferenceFn = Callable[[dict[str, Any]], Coroutine[Any, Any, Any]] + + +@dataclass +class InferenceWorker: + """A named async inference worker. + + Attributes: + worker_id: Unique identifier. + fn: Async callable accepting a feature dict and returning a result. + timeout: Maximum seconds to wait for this worker. ``None`` = no limit. + """ + + worker_id: str + fn: InferenceFn + timeout: float | None = None + + +@dataclass +class InferenceResult: + """Aggregated output from a distributed inference run. + + Attributes: + results: Per-worker outputs keyed by ``worker_id``. + errors: Workers that failed, with error messages. + elapsed_s: Wall-clock time for the parallel run. + """ + + results: dict[str, Any] = field(default_factory=dict) + errors: dict[str, str] = field(default_factory=dict) + elapsed_s: float = 0.0 + + +class DistributedInference: + """Parallel inference engine built on :func:`asyncio.gather`. + + Attributes: + _workers: Registered :class:`InferenceWorker` instances keyed by ID. + """ + + def __init__(self) -> None: + """Initialise with no registered workers.""" + self._workers: dict[str, InferenceWorker] = {} + log.info("DistributedInference initialised") + + def register_worker(self, worker: InferenceWorker) -> None: + """Register an inference worker. + + Args: + worker: :class:`InferenceWorker` to add. + + Raises: + ValueError: If a worker with the same ``worker_id`` is already registered. 
+ """ + if worker.worker_id in self._workers: + raise ValueError(f"Worker '{worker.worker_id}' already registered") + self._workers[worker.worker_id] = worker + log.debug("Worker registered", worker_id=worker.worker_id) + + async def run_parallel( + self, + features: dict[str, Any], + worker_ids: list[str] | None = None, + ) -> InferenceResult: + """Execute selected workers concurrently using :func:`asyncio.gather`. + + Args: + features: Feature dict forwarded to every worker. + worker_ids: Explicit list of workers to run. When *None* all + registered workers are executed. + + Returns: + :class:`InferenceResult` aggregating all worker outputs. + + Raises: + RuntimeError: If no workers are available to run. + """ + targets = { + wid: w + for wid, w in self._workers.items() + if worker_ids is None or wid in (worker_ids or []) + } + if not targets: + raise RuntimeError("No workers available for parallel inference") + + start = time.monotonic() + + async def _run_one(worker: InferenceWorker) -> tuple[str, Any, str | None]: + try: + coro = worker.fn(features) + if worker.timeout is not None: + result = await asyncio.wait_for(coro, timeout=worker.timeout) + else: + result = await coro + return worker.worker_id, result, None + except asyncio.TimeoutError: + return worker.worker_id, None, "timeout" + except Exception as exc: # noqa: BLE001 + return worker.worker_id, None, str(exc) + + raw = await asyncio.gather(*(_run_one(w) for w in targets.values())) + + inference_result = InferenceResult(elapsed_s=time.monotonic() - start) + for wid, result, error in raw: + if error is None: + inference_result.results[wid] = result + else: + inference_result.errors[wid] = error + log.warning("Worker failed", worker_id=wid, error=error) + + log.info( + "Parallel inference complete", + succeeded=len(inference_result.results), + failed=len(inference_result.errors), + elapsed_s=f"{inference_result.elapsed_s:.3f}", + ) + return inference_result + + async def aggregate_results( + self, + 
inference_result: InferenceResult, + strategy: str = "collect", + ) -> Any: + """Combine worker outputs using the specified aggregation strategy. + + Supported strategies: + + * ``"collect"`` – returns a list of all successful results. + * ``"first"`` – returns the first successful result. + * ``"mean"`` – returns the arithmetic mean of numeric results. + + Args: + inference_result: The :class:`InferenceResult` to aggregate. + strategy: Aggregation strategy name. + + Returns: + Aggregated output whose type depends on *strategy*. + + Raises: + ValueError: If *strategy* is not recognised. + """ + values = list(inference_result.results.values()) + if not values: + log.warning("No results to aggregate") + return None + + if strategy == "collect": + return values + elif strategy == "first": + return values[0] + elif strategy == "mean": + numeric = [v for v in values if isinstance(v, (int, float))] + if not numeric: + raise ValueError("No numeric results available for 'mean' aggregation") + return sum(numeric) / len(numeric) + else: + raise ValueError(f"Unknown aggregation strategy '{strategy}'") diff --git a/ai-brain-orchestrator/inference/reflection_loops.py b/ai-brain-orchestrator/inference/reflection_loops.py new file mode 100644 index 0000000..e2454ea --- /dev/null +++ b/ai-brain-orchestrator/inference/reflection_loops.py @@ -0,0 +1,214 @@ +"""Reflection Loops – self-correction through iterative error identification. + +The reflection loop re-evaluates a previous output, identifies logical or +factual errors, and applies targeted corrections, iterating until a +quality threshold is reached or a maximum number of passes is exhausted. +""" + +from __future__ import annotations + +from dataclasses import dataclass, field +from typing import Any, Callable, Coroutine + +from shared.common.logger import get_logger + +log = get_logger(__name__, service="ai-brain-orchestrator") + +# Evaluator: takes a candidate output dict, returns a quality score in [0,1]. 
+EvaluatorFn = Callable[[dict[str, Any]], Coroutine[Any, Any, float]] + +# Corrector: takes a candidate output + list of errors, returns corrected output. +CorrectorFn = Callable[ + [dict[str, Any], list[str]], Coroutine[Any, Any, dict[str, Any]] +] + + +@dataclass +class ReflectionPass: + """Record of a single reflection iteration. + + Attributes: + pass_number: 1-indexed iteration count. + errors_found: Error descriptions identified in this pass. + quality_score: Post-correction quality score. + corrections_applied: List of corrections made. + """ + + pass_number: int + errors_found: list[str] = field(default_factory=list) + quality_score: float = 0.0 + corrections_applied: list[str] = field(default_factory=list) + + +@dataclass +class ReflectionReport: + """Final summary of a complete reflection loop run. + + Attributes: + passes: Ordered list of :class:`ReflectionPass` records. + final_output: The output after all passes. + converged: Whether the quality threshold was reached. + final_score: Quality score of the final output. + """ + + passes: list[ReflectionPass] = field(default_factory=list) + final_output: dict[str, Any] = field(default_factory=dict) + converged: bool = False + final_score: float = 0.0 + + +class ReflectionLoops: + """Iterative self-correction loop for AI model outputs. + + Attributes: + _quality_threshold: Minimum quality score to stop iterating. + _max_passes: Maximum reflection iterations. + """ + + def __init__( + self, + quality_threshold: float = 0.85, + max_passes: int = 5, + ) -> None: + """Initialise the reflection loop engine. + + Args: + quality_threshold: Quality score target. Iteration stops when this + is reached or exceeded. Defaults to ``0.85``. + max_passes: Hard cap on reflection iterations. Defaults to ``5``. + + Raises: + ValueError: If *quality_threshold* is outside ``(0, 1]`` or + *max_passes* < 1. 
+ """ + if not (0 < quality_threshold <= 1.0): + raise ValueError(f"quality_threshold must be in (0, 1], got {quality_threshold}") + if max_passes < 1: + raise ValueError(f"max_passes must be at least 1, got {max_passes}") + self._quality_threshold = quality_threshold + self._max_passes = max_passes + log.info( + "ReflectionLoops initialised", + quality_threshold=quality_threshold, + max_passes=max_passes, + ) + + async def reflect( + self, + output: dict[str, Any], + evaluator: EvaluatorFn, + corrector: CorrectorFn, + ) -> ReflectionReport: + """Run the full reflection loop until convergence or max passes. + + Args: + output: The initial model output to reflect on. + evaluator: Async callable scoring output quality in ``[0, 1]``. + corrector: Async callable that applies corrections given errors. + + Returns: + :class:`ReflectionReport` summarising all passes and the final output. + """ + report = ReflectionReport(final_output=dict(output)) + current_output = dict(output) + + for pass_num in range(1, self._max_passes + 1): + errors = await self.identify_errors(current_output) + score = await evaluator(current_output) + + reflection_pass = ReflectionPass( + pass_number=pass_num, + errors_found=errors, + quality_score=score, + ) + + if score >= self._quality_threshold: + report.converged = True + report.passes.append(reflection_pass) + log.info( + "Reflection converged", + pass_number=pass_num, + score=f"{score:.3f}", + ) + break + + if errors: + corrected = await self.correct(current_output, errors, corrector) + reflection_pass.corrections_applied = [ + f"corrected key: {k}" for k in corrected if corrected.get(k) != current_output.get(k) + ] + current_output = corrected + + report.passes.append(reflection_pass) + log.debug( + "Reflection pass complete", + pass_number=pass_num, + score=f"{score:.3f}", + errors=len(errors), + ) + + report.final_output = current_output + report.final_score = report.passes[-1].quality_score if report.passes else 0.0 + log.info( + 
"Reflection loop finished", + passes=len(report.passes), + converged=report.converged, + final_score=f"{report.final_score:.3f}", + ) + return report + + async def identify_errors(self, output: dict[str, Any]) -> list[str]: + """Analyse *output* and return a list of identified error descriptions. + + This base implementation uses heuristic checks. Subclasses or callers + can inject domain-specific logic via the *corrector* callable. + + Args: + output: The model output dict to inspect. + + Returns: + List of string error descriptions (empty when no errors found). + """ + errors: list[str] = [] + + if not output: + errors.append("Output is empty") + return errors + + # Check for explicit error flags. + if output.get("error"): + errors.append(f"Output contains error flag: {output['error']}") + + # Check for NaN / None values in numeric fields. + for key, value in output.items(): + if value is None: + errors.append(f"Field '{key}' is None") + elif isinstance(value, float) and (value != value): # NaN check + errors.append(f"Field '{key}' is NaN") + + log.debug("Errors identified", count=len(errors)) + return errors + + async def correct( + self, + output: dict[str, Any], + errors: list[str], + corrector: CorrectorFn, + ) -> dict[str, Any]: + """Apply the *corrector* callable to fix identified errors. + + Args: + output: Current model output. + errors: List of error descriptions from :meth:`identify_errors`. + corrector: Async callable that returns a corrected output dict. + + Returns: + Corrected output dict. + """ + try: + corrected = await corrector(output, errors) + log.debug("Corrections applied", error_count=len(errors)) + return corrected + except Exception as exc: # noqa: BLE001 + log.error("Correction failed", error=str(exc)) + return dict(output) # Return unchanged on failure. 
diff --git a/ai-brain-orchestrator/model_hub/__init__.py b/ai-brain-orchestrator/model_hub/__init__.py new file mode 100644 index 0000000..92c4cca --- /dev/null +++ b/ai-brain-orchestrator/model_hub/__init__.py @@ -0,0 +1 @@ +# AI Brain Orchestrator – model_hub sub-package diff --git a/ai-brain-orchestrator/model_hub/__pycache__/__init__.cpython-312.pyc b/ai-brain-orchestrator/model_hub/__pycache__/__init__.cpython-312.pyc new file mode 100644 index 0000000..d53e03f Binary files /dev/null and b/ai-brain-orchestrator/model_hub/__pycache__/__init__.cpython-312.pyc differ diff --git a/ai-brain-orchestrator/model_hub/__pycache__/ensemble_manager.cpython-312.pyc b/ai-brain-orchestrator/model_hub/__pycache__/ensemble_manager.cpython-312.pyc new file mode 100644 index 0000000..f23d889 Binary files /dev/null and b/ai-brain-orchestrator/model_hub/__pycache__/ensemble_manager.cpython-312.pyc differ diff --git a/ai-brain-orchestrator/model_hub/__pycache__/model_registry.cpython-312.pyc b/ai-brain-orchestrator/model_hub/__pycache__/model_registry.cpython-312.pyc new file mode 100644 index 0000000..e19f2aa Binary files /dev/null and b/ai-brain-orchestrator/model_hub/__pycache__/model_registry.cpython-312.pyc differ diff --git a/ai-brain-orchestrator/model_hub/__pycache__/model_selector.cpython-312.pyc b/ai-brain-orchestrator/model_hub/__pycache__/model_selector.cpython-312.pyc new file mode 100644 index 0000000..cb21c4b Binary files /dev/null and b/ai-brain-orchestrator/model_hub/__pycache__/model_selector.cpython-312.pyc differ diff --git a/ai-brain-orchestrator/model_hub/ensemble_manager.py b/ai-brain-orchestrator/model_hub/ensemble_manager.py new file mode 100644 index 0000000..b69e912 --- /dev/null +++ b/ai-brain-orchestrator/model_hub/ensemble_manager.py @@ -0,0 +1,151 @@ +"""Ensemble Manager – multi-model coordination with weighted prediction aggregation. 
+ +Maintains a weighted pool of model references and combines their outputs +through configurable aggregation strategies (weighted average, majority vote). +""" + +from __future__ import annotations + +import asyncio +from dataclasses import dataclass, field +from typing import Any, Callable, Coroutine + +from shared.common.logger import get_logger + +log = get_logger(__name__, service="ai-brain-orchestrator") + +# Inference callable: receives a feature dict, returns a prediction dict. +InferenceFn = Callable[[dict[str, Any]], Coroutine[Any, Any, dict[str, Any]]] + + +@dataclass +class EnsembleMember: + """A single model participant in an ensemble. + + Attributes: + model_id: Registry identifier for this model. + weight: Relative contribution weight (will be normalised). + infer: Async callable that runs the model. + enabled: Whether this member participates in predictions. + """ + + model_id: str + weight: float = 1.0 + infer: InferenceFn | None = field(default=None, repr=False) + enabled: bool = True + + +class EnsembleManager: + """Coordinates multiple models and aggregates their predictions. + + Attributes: + registry: Optional :class:`ModelRegistry` for metadata look-ups. + _members: Ordered list of :class:`EnsembleMember` objects. + """ + + def __init__(self, registry: Any | None = None) -> None: + """Initialise with an optional model registry reference. + + Args: + registry: Optional :class:`ModelRegistry` instance. + """ + self.registry = registry + self._members: list[EnsembleMember] = [] + log.info("EnsembleManager initialised") + + def add_model( + self, + model_id: str, + weight: float = 1.0, + infer: InferenceFn | None = None, + ) -> None: + """Add a model to the ensemble. + + Args: + model_id: Registry identifier for the model. + weight: Relative contribution weight. Defaults to ``1.0``. + infer: Async inference callable. May be set later. + + Raises: + ValueError: If a model with the same ``model_id`` already exists. 
+ """ + if any(m.model_id == model_id for m in self._members): + raise ValueError(f"Model '{model_id}' is already in the ensemble") + if weight <= 0: + raise ValueError(f"weight must be positive, got {weight}") + self._members.append(EnsembleMember(model_id=model_id, weight=weight, infer=infer)) + log.info("Ensemble member added", model_id=model_id, weight=weight) + + async def predict(self, features: dict[str, Any]) -> dict[str, Any]: + """Run all enabled members concurrently and return the weighted ensemble output. + + Args: + features: Feature dict forwarded to every member's ``infer`` callable. + + Returns: + A dict with ``ensemble_prediction`` (weighted average of ``prediction`` + fields) and ``member_results`` (list of individual outputs). + + Raises: + RuntimeError: If no enabled members with inference callables exist. + """ + active = [m for m in self._members if m.enabled and m.infer is not None] + if not active: + raise RuntimeError("No active ensemble members with inference callables") + + async def _run(member: EnsembleMember) -> dict[str, Any]: + try: + result = await member.infer(features) # type: ignore[misc] + return {"model_id": member.model_id, "weight": member.weight, **result} + except Exception as exc: # noqa: BLE001 + log.error("Member inference failed", model_id=member.model_id, error=str(exc)) + return {"model_id": member.model_id, "weight": 0.0, "prediction": 0.0} + + raw_results = await asyncio.gather(*(_run(m) for m in active)) + ensemble_result = await self.weighted_ensemble(list(raw_results)) + log.info( + "Ensemble prediction complete", + member_count=len(raw_results), + ensemble_prediction=ensemble_result.get("ensemble_prediction"), + ) + return ensemble_result + + async def weighted_ensemble( + self, member_results: list[dict[str, Any]] + ) -> dict[str, Any]: + """Aggregate member predictions using normalised weights. 
+ + Args: + member_results: List of per-member result dicts, each expected to + carry ``prediction`` (float) and ``weight`` (float) keys. + + Returns: + Dict with ``ensemble_prediction`` (float) and ``member_results``. + """ + total_weight = sum(r.get("weight", 0.0) for r in member_results) + if total_weight == 0: + return {"ensemble_prediction": 0.0, "member_results": member_results} + + weighted_sum = sum( + r.get("prediction", 0.0) * r.get("weight", 0.0) for r in member_results + ) + ensemble_prediction = weighted_sum / total_weight + return { + "ensemble_prediction": ensemble_prediction, + "member_results": member_results, + } + + def remove_model(self, model_id: str) -> None: + """Remove a model from the ensemble. + + Args: + model_id: Identifier of the member to remove. + + Raises: + KeyError: If *model_id* is not in the ensemble. + """ + before = len(self._members) + self._members = [m for m in self._members if m.model_id != model_id] + if len(self._members) == before: + raise KeyError(f"Model '{model_id}' not found in ensemble") + log.info("Ensemble member removed", model_id=model_id) diff --git a/ai-brain-orchestrator/model_hub/model_registry.py b/ai-brain-orchestrator/model_hub/model_registry.py new file mode 100644 index 0000000..e00a40f --- /dev/null +++ b/ai-brain-orchestrator/model_hub/model_registry.py @@ -0,0 +1,168 @@ +"""Model Registry – central model versioning and lifecycle management. + +Provides a versioned catalogue of AI model descriptors. Actual model weights +are referenced by URI so the registry itself carries no ML framework dependency. 
+""" + +from __future__ import annotations + +import uuid +from dataclasses import dataclass, field +from enum import Enum, auto +from typing import Any + +from shared.common.logger import get_logger + +log = get_logger(__name__, service="ai-brain-orchestrator") + + +class ModelStatus(Enum): + """Lifecycle status of a registered model.""" + + REGISTERED = auto() + ACTIVE = auto() + DEPRECATED = auto() + ARCHIVED = auto() + + +@dataclass +class ModelDescriptor: + """Metadata record for a single model version. + + Attributes: + model_id: Unique identifier, auto-generated when omitted. + name: Human-readable model name. + version: Semantic version string (e.g. ``"1.2.0"``). + model_type: Category tag (e.g. ``"classifier"``, ``"regressor"``). + uri: Location of the model artefact (path or remote URI). + status: Current lifecycle status. + performance_metrics: Dict of evaluation metrics (e.g. RMSE, accuracy). + tags: Arbitrary keyword labels for filtering. + metadata: Additional structured data. + """ + + name: str + version: str + model_type: str = "generic" + uri: str = "" + model_id: str = field(default_factory=lambda: str(uuid.uuid4())) + status: ModelStatus = ModelStatus.REGISTERED + performance_metrics: dict[str, float] = field(default_factory=dict) + tags: list[str] = field(default_factory=list) + metadata: dict[str, Any] = field(default_factory=dict) + + +class ModelRegistry: + """Versioned model catalogue with register, retrieval, and deprecation. + + Attributes: + _models: Primary store keyed by ``model_id``. + _name_index: Secondary index mapping ``(name, version)`` → ``model_id``. + """ + + def __init__(self) -> None: + """Initialise an empty model registry.""" + self._models: dict[str, ModelDescriptor] = {} + self._name_index: dict[tuple[str, str], str] = {} + log.info("ModelRegistry initialised") + + def register(self, descriptor: ModelDescriptor) -> str: + """Add a new model version to the registry. 
+ + Args: + descriptor: :class:`ModelDescriptor` to register. + + Returns: + The ``model_id`` of the registered model. + + Raises: + ValueError: If a model with the same ``(name, version)`` already exists. + """ + key = (descriptor.name, descriptor.version) + if key in self._name_index: + raise ValueError( + f"Model '{descriptor.name}' v{descriptor.version} already registered" + ) + descriptor.status = ModelStatus.ACTIVE + self._models[descriptor.model_id] = descriptor + self._name_index[key] = descriptor.model_id + log.info( + "Model registered", + model_id=descriptor.model_id, + name=descriptor.name, + version=descriptor.version, + ) + return descriptor.model_id + + def get(self, model_id: str) -> ModelDescriptor: + """Retrieve a model by its unique ID. + + Args: + model_id: The ``model_id`` to look up. + + Returns: + The corresponding :class:`ModelDescriptor`. + + Raises: + KeyError: If *model_id* is not found. + """ + if model_id not in self._models: + raise KeyError(f"Model '{model_id}' not found in registry") + return self._models[model_id] + + def get_by_name(self, name: str, version: str) -> ModelDescriptor: + """Retrieve a model by name and version. + + Args: + name: Model name. + version: Semantic version string. + + Returns: + The corresponding :class:`ModelDescriptor`. + + Raises: + KeyError: If the ``(name, version)`` pair is not found. + """ + key = (name, version) + if key not in self._name_index: + raise KeyError(f"Model '{name}' v{version} not found") + return self._models[self._name_index[key]] + + def list_models( + self, + model_type: str | None = None, + status: ModelStatus | None = None, + tag: str | None = None, + ) -> list[ModelDescriptor]: + """Return models optionally filtered by type, status, or tag. + + Args: + model_type: Filter to a specific model category. + status: Filter to a specific lifecycle status. + tag: Filter to models carrying this tag label. + + Returns: + List of matching :class:`ModelDescriptor` instances. 
+ """ + results = list(self._models.values()) + if model_type is not None: + results = [m for m in results if m.model_type == model_type] + if status is not None: + results = [m for m in results if m.status == status] + if tag is not None: + results = [m for m in results if tag in m.tags] + log.debug("Models listed", count=len(results), filters={"type": model_type, "status": status, "tag": tag}) + return results + + def deprecate(self, model_id: str) -> None: + """Mark a model as deprecated so it is excluded from active selection. + + Args: + model_id: The ``model_id`` to deprecate. + + Raises: + KeyError: If *model_id* is not found. + """ + model = self.get(model_id) + model.status = ModelStatus.DEPRECATED + log.info("Model deprecated", model_id=model_id, name=model.name, version=model.version) diff --git a/ai-brain-orchestrator/model_hub/model_selector.py b/ai-brain-orchestrator/model_hub/model_selector.py new file mode 100644 index 0000000..09a119a --- /dev/null +++ b/ai-brain-orchestrator/model_hub/model_selector.py @@ -0,0 +1,152 @@ +"""Model Selector – dynamic model selection based on market conditions. + +Evaluates registered models against current market context metrics and +selects the most appropriate candidate for inference. +""" + +from __future__ import annotations + +from dataclasses import dataclass, field +from typing import Any + +from shared.common.logger import get_logger + +log = get_logger(__name__, service="ai-brain-orchestrator") + + +@dataclass +class SelectionCriteria: + """Criteria used to evaluate and rank candidate models. + + Attributes: + market_regime: Current regime label (e.g. ``"trending"``, ``"ranging"``). + volatility: Normalised volatility level in ``[0.0, 1.0]``. + required_tags: Model tags that must all be present for a model to qualify. + min_metric: Minimum performance metric threshold keyed by metric name. 
+ """ + + market_regime: str = "unknown" + volatility: float = 0.5 + required_tags: list[str] = field(default_factory=list) + min_metric: dict[str, float] = field(default_factory=dict) + + +@dataclass +class EvaluationRecord: + """Historical performance record for a single model. + + Attributes: + model_id: Registry identifier. + metric_name: Name of the tracked metric. + score: Measured metric value. + regime: Market regime at evaluation time. + """ + + model_id: str + metric_name: str + score: float + regime: str = "unknown" + + +class ModelSelector: + """Dynamic model selection engine for context-aware inference routing. + + Attributes: + registry: Optional :class:`ModelRegistry` for descriptor look-ups. + _evaluations: Per-model evaluation history. + """ + + def __init__(self, registry: Any | None = None) -> None: + """Initialise the selector with an optional registry reference. + + Args: + registry: Optional :class:`ModelRegistry` instance. + """ + self.registry = registry + self._evaluations: dict[str, list[EvaluationRecord]] = {} + log.info("ModelSelector initialised") + + def evaluate_performance(self, record: EvaluationRecord) -> None: + """Record a performance observation for a model. + + Args: + record: :class:`EvaluationRecord` to append to the model's history. + """ + self._evaluations.setdefault(record.model_id, []).append(record) + log.debug( + "Performance recorded", + model_id=record.model_id, + metric=record.metric_name, + score=record.score, + regime=record.regime, + ) + + def select( + self, + criteria: SelectionCriteria, + candidate_ids: list[str] | None = None, + ) -> str | None: + """Choose the best model given *criteria* from the available candidates. + + Ranking uses the mean score of evaluations that match the requested + regime. When no regime-specific evaluations exist, all evaluations are + used. Models failing ``min_metric`` constraints are excluded. + + Args: + criteria: :class:`SelectionCriteria` describing the current context. 
+ candidate_ids: Explicit allow-list of model IDs to consider. When + *None*, all models with evaluation records are considered. + + Returns: + The ``model_id`` of the best candidate, or *None* if none qualify. + """ + pool = candidate_ids if candidate_ids is not None else list(self._evaluations.keys()) + + # Apply tag filter when a registry is available. + if self.registry and criteria.required_tags: + filtered = [] + for mid in pool: + try: + desc = self.registry.get(mid) + if all(t in desc.tags for t in criteria.required_tags): + filtered.append(mid) + except KeyError: + pass + pool = filtered + + scores: dict[str, float] = {} + for mid in pool: + history = self._evaluations.get(mid, []) + if not history: + continue + + # Prefer regime-matched records. + regime_records = [e for e in history if e.regime == criteria.market_regime] + relevant = regime_records if regime_records else history + + mean_score = sum(e.score for e in relevant) / len(relevant) + + # Enforce min_metric constraints. 
+ disqualified = False + for metric, threshold in criteria.min_metric.items(): + metric_records = [e for e in relevant if e.metric_name == metric] + if metric_records: + best = max(e.score for e in metric_records) + if best < threshold: + disqualified = True + break + if not disqualified: + scores[mid] = mean_score + + if not scores: + log.warning("No qualifying models found", regime=criteria.market_regime) + return None + + winner = max(scores, key=lambda m: scores[m]) + log.info( + "Model selected", + model_id=winner, + score=f"{scores[winner]:.4f}", + regime=criteria.market_regime, + ) + return winner diff --git a/devsecops/__init__.py b/devsecops/__init__.py new file mode 100644 index 0000000..0b04b08 --- /dev/null +++ b/devsecops/__init__.py @@ -0,0 +1,81 @@ +"""DevSecOps: Security-integrated CI/CD framework for the trading platform.""" + +from __future__ import annotations + +from loguru import logger + +from devsecops.security.secret_manager import SecretManager +from devsecops.security.encryption import Encryption +from devsecops.security.threat_detection import ThreatDetection +from devsecops.security.compliance_checker import ComplianceChecker +from devsecops.scanning.code_scanner import CodeScanner +from devsecops.scanning.dependency_scanner import DependencyScanner +from devsecops.scanning.container_scanner import ContainerScanner +from devsecops.scanning.api_scanner import APIScanner +from devsecops.cicd.build_pipeline import BuildPipeline +from devsecops.cicd.test_automation import TestAutomation +from devsecops.cicd.deployment_gates import DeploymentGates +from devsecops.cicd.rollback_mechanism import RollbackMechanism +from devsecops.audit.audit_logger import AuditLogger +from devsecops.audit.trade_logger import TradeLogger +from devsecops.audit.compliance_reporter import ComplianceReporter + + +class DevSecOps: + """Unified DevSecOps orchestrator for trading platform security operations. 
class DevSecOps:
    """Unified DevSecOps orchestrator for trading platform security operations.

    Aggregates secret management, encryption, threat detection, compliance,
    scanning, CI/CD gating, and audit logging.

    Attributes:
        secret_manager: API key and secret management.
        encryption: Data encryption/decryption.
        threat_detection: Security monitoring and rate limiting.
        compliance_checker: Regulatory compliance checks.
        code_scanner: Static application security testing.
        dependency_scanner: Vulnerability scanning.
        container_scanner: Container image security scanning.
        api_scanner: API security testing.
        build_pipeline: Build orchestration with security gates.
        test_automation: Automated security testing runner.
        deployment_gates: Pre-deployment security checkpoints.
        rollback_mechanism: Safe rollback with health checks.
        audit_logger: Immutable HMAC-signed audit log.
        trade_logger: Trading activity log.
        compliance_reporter: Regulatory report generation.
    """

    def __init__(self) -> None:
        """Construct every DevSecOps sub-component."""
        self.secret_manager = SecretManager()
        self.encryption = Encryption()
        self.threat_detection = ThreatDetection()
        self.compliance_checker = ComplianceChecker()
        self.code_scanner = CodeScanner()
        self.dependency_scanner = DependencyScanner()
        self.container_scanner = ContainerScanner()
        self.api_scanner = APIScanner()
        self.build_pipeline = BuildPipeline()
        self.test_automation = TestAutomation()
        self.deployment_gates = DeploymentGates()
        self.rollback_mechanism = RollbackMechanism()
        self.audit_logger = AuditLogger()
        self.trade_logger = TradeLogger()
        self.compliance_reporter = ComplianceReporter()
        logger.info("DevSecOps initialised")

    def status(self) -> dict[str, str]:
        """Return a health summary for all sub-components.

        Returns:
            Mapping of component name to status string (always ``"ready"``).
        """
        component_names = (
            "secret_manager", "encryption", "threat_detection", "compliance_checker",
            "code_scanner", "dependency_scanner", "container_scanner", "api_scanner",
            "build_pipeline", "test_automation", "deployment_gates", "rollback_mechanism",
            "audit_logger", "trade_logger", "compliance_reporter",
        )
        return dict.fromkeys(component_names, "ready")


__all__ = ["DevSecOps"]
+"""Comprehensive immutable audit logging with HMAC signatures.""" + +from __future__ import annotations + +import hashlib +import hmac +import json +import os +import time +from dataclasses import asdict, dataclass, field +from datetime import datetime, timezone +from typing import Any + +from loguru import logger + + +@dataclass +class AuditEntry: + """A single immutable audit log entry. + + Attributes: + entry_id: Monotonically incrementing identifier. + event_type: Category of event (e.g. ``"TRADE_EXECUTED"``). + actor: Identity of the user/system that triggered the event. + resource: Resource affected (e.g. ``"order:12345"``). + action: Specific action performed. + details: Supplementary event data. + outcome: ``"SUCCESS"`` or ``"FAILURE"``. + ip_address: Originating IP address. + timestamp: UTC ISO-8601 timestamp string. + sequence: Global sequence number for ordering. + signature: HMAC-SHA256 hex digest of the entry (excluding this field). + """ + + entry_id: str + event_type: str + actor: str + resource: str + action: str + details: dict[str, Any] + outcome: str + ip_address: str + timestamp: str + sequence: int + signature: str = "" + + +class AuditLogger: + """Comprehensive immutable audit logger with HMAC-SHA256 integrity signing. + + Each log entry is signed with HMAC-SHA256 using a key sourced from the + ``AUDIT_HMAC_KEY`` environment variable. If the key is not set, a + session-ephemeral random key is used (warns on startup). + + Entries are stored in-memory and can be exported to a JSON Lines file. + + Attributes: + _entries: Ordered log entries. + _sequence: Monotonic sequence counter. + _hmac_key: Signing key bytes. 
+ """ + + _ENV_KEY = "AUDIT_HMAC_KEY" + + def __init__(self) -> None: + """Initialise the audit logger.""" + self._entries: list[AuditEntry] = [] + self._sequence: int = 0 + raw_key = os.environ.get(self._ENV_KEY) + + if raw_key: + self._hmac_key = raw_key.encode() + logger.info("AuditLogger: HMAC key loaded from environment") + else: + self._hmac_key = os.urandom(32) + logger.warning( + "AuditLogger: {} not set — using ephemeral HMAC key. " + "Signatures will not be reproducible across restarts.", + self._ENV_KEY, + ) + + def log( + self, + event_type: str, + actor: str, + resource: str, + action: str, + details: dict[str, Any] | None = None, + outcome: str = "SUCCESS", + ip_address: str = "0.0.0.0", + ) -> AuditEntry: + """Record an auditable event. + + Args: + event_type: Event category. + actor: Identity of the triggering user/system. + resource: Affected resource identifier. + action: Action description. + details: Optional supplementary data. + outcome: ``"SUCCESS"`` or ``"FAILURE"``. + ip_address: Originating IP. + + Returns: + The signed and appended :class:`AuditEntry`. + """ + self._sequence += 1 + entry_id = f"audit_{self._sequence:010d}" + timestamp = datetime.now(timezone.utc).isoformat() + + entry = AuditEntry( + entry_id=entry_id, + event_type=event_type, + actor=actor, + resource=resource, + action=action, + details=details or {}, + outcome=outcome, + ip_address=ip_address, + timestamp=timestamp, + sequence=self._sequence, + ) + entry.signature = self._sign(entry) + self._entries.append(entry) + logger.debug("Audit: [{}] {}:{} by {} → {}", event_type, resource, action, actor, outcome) + return entry + + def verify_entry(self, entry: AuditEntry) -> bool: + """Verify the HMAC signature of an audit entry. + + Args: + entry: Entry to verify. + + Returns: + ``True`` if the signature is valid (entry has not been tampered). 
+ """ + expected = self._sign(entry) + return hmac.compare_digest(expected, entry.signature) + + def verify_chain(self) -> tuple[bool, list[str]]: + """Verify the integrity of the entire audit log. + + Returns: + Tuple of ``(all_valid, list_of_tampered_entry_ids)``. + """ + tampered: list[str] = [] + for entry in self._entries: + if not self.verify_entry(entry): + tampered.append(entry.entry_id) + + if tampered: + logger.error("Audit log integrity violation: {} tampered entries", len(tampered)) + else: + logger.info("Audit log integrity verified: {} entries OK", len(self._entries)) + + return len(tampered) == 0, tampered + + def export_jsonl(self, file_path: str) -> int: + """Export all audit entries to a JSON Lines file. + + Args: + file_path: Output file path. + + Returns: + Number of entries exported. + """ + with open(file_path, "w", encoding="utf-8") as f: + for entry in self._entries: + f.write(json.dumps(asdict(entry)) + "\n") + logger.info("Exported {} audit entries to '{}'", len(self._entries), file_path) + return len(self._entries) + + def query( + self, + event_type: str | None = None, + actor: str | None = None, + limit: int = 100, + ) -> list[AuditEntry]: + """Query audit entries with optional filters. + + Args: + event_type: Filter by event type. + actor: Filter by actor. + limit: Maximum number of results to return. + + Returns: + Matching entries (most recent first), up to ``limit``. + """ + results = [ + e for e in reversed(self._entries) + if (event_type is None or e.event_type == event_type) + and (actor is None or e.actor == actor) + ] + return results[:limit] + + def _sign(self, entry: AuditEntry) -> str: + """Compute the HMAC-SHA256 signature for an entry. + + The signature covers all fields except ``signature`` itself. + + Args: + entry: Entry to sign. + + Returns: + Hex-encoded HMAC-SHA256 digest. 
+ """ + payload = json.dumps( + { + k: v for k, v in asdict(entry).items() if k != "signature" + }, + sort_keys=True, + default=str, + ).encode() + return hmac.new(self._hmac_key, payload, hashlib.sha256).hexdigest() + + @property + def entry_count(self) -> int: + """Total number of logged entries.""" + return len(self._entries) diff --git a/devsecops/audit/compliance_reporter.py b/devsecops/audit/compliance_reporter.py new file mode 100644 index 0000000..6b49558 --- /dev/null +++ b/devsecops/audit/compliance_reporter.py @@ -0,0 +1,347 @@ +"""Regulatory compliance reporting for trading platform audits.""" + +from __future__ import annotations + +import json +from dataclasses import asdict, dataclass, field +from datetime import datetime, date, timezone +from typing import Any + +from loguru import logger + + +@dataclass +class ReportPeriod: + """Date range for a compliance report. + + Attributes: + start: Inclusive start date. + end: Inclusive end date. + """ + + start: date + end: date + + def __post_init__(self) -> None: + """Validate that start ≤ end.""" + if self.start > self.end: + raise ValueError(f"start {self.start} must not be after end {self.end}") + + @property + def days(self) -> int: + """Number of days in the period.""" + return (self.end - self.start).days + 1 + + +@dataclass +class ComplianceReport: + """A generated regulatory compliance report. + + Attributes: + report_id: Unique identifier. + regulation: Target regulation (e.g. ``"FINRA"``, ``"MiFID2"``). + period: Reporting period. + entity_id: Regulated entity identifier. + sections: Named report sections with their content. + findings: List of compliance findings/issues. + attestation: Attestation statement. + generated_at: UTC generation timestamp. + status: ``"DRAFT"`` or ``"FINAL"``. 
+ """ + + report_id: str + regulation: str + period: ReportPeriod + entity_id: str + sections: dict[str, Any] + findings: list[dict[str, Any]] + attestation: str + generated_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + status: str = "DRAFT" + + +class ComplianceReporter: + """Regulatory report generation for trading compliance obligations. + + Generates structured compliance reports for FINRA, MiFID2, and + other regulatory frameworks based on audit log and trade data. + + Attributes: + generated_reports: All generated reports keyed by report_id. + _report_counter: Report ID counter. + """ + + _SUPPORTED_REGULATIONS: set[str] = {"FINRA", "MiFID2", "SOX", "GDPR", "SEC"} + + def __init__(self) -> None: + """Initialise the compliance reporter.""" + self.generated_reports: dict[str, ComplianceReport] = {} + self._report_counter = 0 + logger.info("ComplianceReporter initialised") + + def generate_finra_report( + self, + entity_id: str, + period: ReportPeriod, + trade_data: list[dict[str, Any]], + audit_events: list[dict[str, Any]], + ) -> ComplianceReport: + """Generate a FINRA compliance report. + + Args: + entity_id: Regulated entity identifier. + period: Reporting period. + trade_data: Trade execution records for the period. + audit_events: Audit log entries for the period. + + Returns: + Generated :class:`ComplianceReport`. 
+ """ + report_id = self._next_report_id("FINRA") + total_trades = len(trade_data) + total_value = sum( + t.get("quantity", 0) * t.get("price", 0) for t in trade_data + ) + + sections = { + "executive_summary": { + "entity": entity_id, + "period": f"{period.start} to {period.end}", + "total_trades": total_trades, + "total_notional_value": round(total_value, 2), + "reporting_obligation": "FINRA Rule 4511 Books and Records", + }, + "trade_activity": self._summarise_trades(trade_data), + "best_execution": self._best_execution_analysis(trade_data), + "supervisory_controls": { + "audit_events_reviewed": len(audit_events), + "anomalies_detected": sum( + 1 for e in audit_events if e.get("outcome") == "FAILURE" + ), + }, + "record_retention": { + "records_retained_days": period.days, + "meets_6_year_requirement": period.days <= 365 * 6, + }, + } + + findings = self._identify_finra_findings(trade_data, audit_events) + report = ComplianceReport( + report_id=report_id, + regulation="FINRA", + period=period, + entity_id=entity_id, + sections=sections, + findings=findings, + attestation=( + f"This report was generated automatically for {entity_id}. " + "Manual review and attestation by a compliance officer is required " + "before submission." + ), + ) + self.generated_reports[report_id] = report + logger.info("FINRA report generated: {} ({})", report_id, period) + return report + + def generate_mifid2_report( + self, + entity_id: str, + period: ReportPeriod, + trade_data: list[dict[str, Any]], + ) -> ComplianceReport: + """Generate a MiFID2 transaction reporting summary. + + Args: + entity_id: Entity identifier. + period: Reporting period. + trade_data: Trade execution records. + + Returns: + Generated :class:`ComplianceReport`. 
+ """ + report_id = self._next_report_id("MiFID2") + sections = { + "transaction_report": self._summarise_trades(trade_data), + "best_execution_policy": { + "total_executions": len(trade_data), + "venues": list({t.get("venue", "unknown") for t in trade_data}), + }, + "pre_trade_transparency": { + "orders_displayed": len(trade_data), + "waivers_applied": 0, + }, + "post_trade_transparency": { + "reports_submitted": len(trade_data), + "deferrals": 0, + }, + } + + report = ComplianceReport( + report_id=report_id, + regulation="MiFID2", + period=period, + entity_id=entity_id, + sections=sections, + findings=[], + attestation=( + f"MiFID2 transaction report for {entity_id}. " + "Requires review by compliance officer before regulatory submission." + ), + ) + self.generated_reports[report_id] = report + logger.info("MiFID2 report generated: {} ({})", report_id, period) + return report + + def export_json(self, report_id: str) -> str: + """Export a report as a formatted JSON string. + + Args: + report_id: Report identifier. + + Returns: + JSON string representation of the report. + + Raises: + KeyError: If ``report_id`` is not found. + """ + if report_id not in self.generated_reports: + raise KeyError(f"Report '{report_id}' not found") + + report = self.generated_reports[report_id] + data = { + "report_id": report.report_id, + "regulation": report.regulation, + "period": {"start": str(report.period.start), "end": str(report.period.end)}, + "entity_id": report.entity_id, + "sections": report.sections, + "findings": report.findings, + "attestation": report.attestation, + "generated_at": report.generated_at.isoformat(), + "status": report.status, + } + return json.dumps(data, indent=2, default=str) + + def finalise(self, report_id: str, officer_name: str) -> ComplianceReport: + """Mark a report as FINAL with officer attestation. + + Args: + report_id: Report to finalise. + officer_name: Name of the attesting compliance officer. 
+ + Returns: + Updated :class:`ComplianceReport`. + + Raises: + KeyError: If report not found. + """ + if report_id not in self.generated_reports: + raise KeyError(f"Report '{report_id}' not found") + + report = self.generated_reports[report_id] + report.status = "FINAL" + report.attestation += f"\n\nAttestation by: {officer_name} on {datetime.now(timezone.utc).isoformat()}" + logger.info("Report {} finalised by {}", report_id, officer_name) + return report + + def _next_report_id(self, regulation: str) -> str: + """Generate the next report identifier. + + Args: + regulation: Regulation prefix. + + Returns: + Report ID string. + """ + self._report_counter += 1 + ts = datetime.now(timezone.utc).strftime("%Y%m%d") + return f"{regulation}-{ts}-{self._report_counter:04d}" + + @staticmethod + def _summarise_trades(trades: list[dict[str, Any]]) -> dict[str, Any]: + """Summarise trade data for report sections. + + Args: + trades: Trade records. + + Returns: + Summary dictionary. + """ + if not trades: + return {"count": 0, "total_value": 0.0, "symbols": []} + + symbols = list({t.get("symbol", "unknown") for t in trades}) + total_value = sum(t.get("quantity", 0) * t.get("price", 0) for t in trades) + buy_count = sum(1 for t in trades if t.get("direction", "").upper() == "BUY") + sell_count = len(trades) - buy_count + + return { + "count": len(trades), + "total_value": round(total_value, 2), + "symbols": symbols, + "buy_count": buy_count, + "sell_count": sell_count, + } + + @staticmethod + def _best_execution_analysis(trades: list[dict[str, Any]]) -> dict[str, Any]: + """Analyse best execution quality. + + Args: + trades: Trade records with optional ``"slippage"`` field. + + Returns: + Best execution metrics. 
+ """ + slippages = [t.get("slippage", 0.0) for t in trades] + if not slippages: + return {"mean_slippage": 0.0, "max_slippage": 0.0} + + import numpy as np + return { + "mean_slippage": round(float(np.mean(slippages)), 6), + "max_slippage": round(float(np.max(slippages)), 6), + "trades_with_positive_slippage": sum(1 for s in slippages if s > 0), + } + + @staticmethod + def _identify_finra_findings( + trades: list[dict[str, Any]], + audit_events: list[dict[str, Any]], + ) -> list[dict[str, Any]]: + """Identify potential FINRA compliance findings. + + Args: + trades: Trade records. + audit_events: Audit log entries. + + Returns: + List of finding dictionaries. + """ + findings: list[dict[str, Any]] = [] + + # Check for large trades without pre-approval + large_trades = [ + t for t in trades + if t.get("quantity", 0) * t.get("price", 0) > 1_000_000 + and not t.get("pre_approved", False) + ] + if large_trades: + findings.append({ + "finding_id": "FINRA-001", + "description": f"{len(large_trades)} large trade(s) without pre-approval", + "severity": "HIGH", + "trade_ids": [t.get("trade_id") for t in large_trades[:5]], + }) + + # Check for after-hours trades + after_hours = [ + t for t in trades if t.get("after_hours", False) + ] + if after_hours: + findings.append({ + "finding_id": "FINRA-002", + "description": f"{len(after_hours)} after-hours trade(s) detected", + "severity": "MEDIUM", + }) + + return findings diff --git a/devsecops/audit/trade_logger.py b/devsecops/audit/trade_logger.py new file mode 100644 index 0000000..73498cc --- /dev/null +++ b/devsecops/audit/trade_logger.py @@ -0,0 +1,283 @@ +"""Trading activity log with PnL tracking.""" + +from __future__ import annotations + +from dataclasses import dataclass, field +from datetime import datetime, timezone +from enum import Enum, auto +from typing import Any + +import numpy as np +from loguru import logger + + +class TradeDirection(Enum): + """Trade direction.""" + + BUY = auto() + SELL = auto() + + +class 
class TradeDirection(Enum):
    """Trade direction."""

    BUY = auto()
    SELL = auto()


class TradeStatus(Enum):
    """Settlement status of a trade."""

    PENDING = auto()
    FILLED = auto()
    PARTIALLY_FILLED = auto()
    CANCELLED = auto()
    REJECTED = auto()


@dataclass
class TradeRecord:
    """A single trade activity record.

    Attributes:
        trade_id: Unique trade identifier.
        symbol: Instrument symbol.
        direction: BUY or SELL.
        quantity: Number of units traded.
        price: Execution price.
        status: Settlement status.
        strategy_id: Owning strategy identifier.
        account_id: Trading account identifier.
        commission: Brokerage commission in base currency.
        slippage: Slippage in price units.
        executed_at: UTC execution timestamp.
        notes: Optional free-text notes.
    """

    trade_id: str
    symbol: str
    direction: TradeDirection
    quantity: float
    price: float
    status: TradeStatus
    strategy_id: str = ""
    account_id: str = ""
    commission: float = 0.0
    slippage: float = 0.0
    executed_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc))
    notes: str = ""

    @property
    def notional_value(self) -> float:
        """Notional trade value (quantity × price)."""
        return self.quantity * self.price

    @property
    def net_cost(self) -> float:
        """Signed notional plus commission: positive for buys, negative for sells."""
        side = -1.0 if self.direction is TradeDirection.SELL else 1.0
        return side * self.notional_value + self.commission


@dataclass
class PnLSnapshot:
    """Profit and loss snapshot at a point in time.

    Attributes:
        account_id: Account identifier.
        realised_pnl: Realised P&L for closed positions.
        unrealised_pnl: Unrealised P&L on open positions.
        total_pnl: Sum of realised and unrealised.
        trade_count: Number of trades contributing.
        commission_total: Total commission paid.
        snapshot_at: UTC timestamp.
    """

    account_id: str
    realised_pnl: float
    unrealised_pnl: float
    total_pnl: float
    trade_count: int
    commission_total: float
    snapshot_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc))
+ """ + if quantity <= 0: + raise ValueError(f"quantity must be positive, got {quantity}") + if price <= 0: + raise ValueError(f"price must be positive, got {price}") + + self._trade_counter += 1 + trade_id = f"TRADE-{self._trade_counter:010d}" + record = TradeRecord( + trade_id=trade_id, + symbol=symbol, + direction=direction, + quantity=quantity, + price=price, + status=status, + strategy_id=strategy_id, + account_id=account_id, + commission=commission, + slippage=slippage, + notes=notes, + ) + self.trades[trade_id] = record + + if status == TradeStatus.FILLED: + self._update_position(record) + + self._commission_totals[account_id] = ( + self._commission_totals.get(account_id, 0.0) + commission + ) + logger.info( + "Trade {}: {} {} {} @ {:.4f} (account={})", + trade_id, + direction.name, + quantity, + symbol, + price, + account_id, + ) + return record + + def _update_position(self, trade: TradeRecord) -> None: + """Update FIFO position model with a new fill. + + Args: + trade: Filled trade record. + """ + key = f"{trade.account_id}:{trade.symbol}" + if key not in self._positions: + self._positions[key] = [] + + if trade.direction == TradeDirection.BUY: + self._positions[key].append({"qty": trade.quantity, "cost": trade.price}) + else: + qty_to_close = trade.quantity + realised = 0.0 + while qty_to_close > 0 and self._positions[key]: + lot = self._positions[key][0] + fill = min(lot["qty"], qty_to_close) + realised += fill * (trade.price - lot["cost"]) + lot["qty"] -= fill + qty_to_close -= fill + if lot["qty"] <= 1e-10: + self._positions[key].pop(0) + + account = trade.account_id + self._realised_pnl[account] = self._realised_pnl.get(account, 0.0) + realised + + def pnl_snapshot( + self, + account_id: str = "default", + current_prices: dict[str, float] | None = None, + ) -> PnLSnapshot: + """Compute a P&L snapshot for an account. + + Args: + account_id: Account to snapshot. + current_prices: Current mark-to-market prices per symbol. 
+ + Returns: + :class:`PnLSnapshot` with realised and unrealised P&L. + """ + realised = self._realised_pnl.get(account_id, 0.0) + commission_total = self._commission_totals.get(account_id, 0.0) + unrealised = 0.0 + + if current_prices: + for key, lots in self._positions.items(): + acc, symbol = key.split(":", 1) + if acc != account_id: + continue + current = current_prices.get(symbol) + if current is not None: + for lot in lots: + unrealised += lot["qty"] * (current - lot["cost"]) + + trade_count = sum( + 1 for t in self.trades.values() + if t.account_id == account_id and t.status == TradeStatus.FILLED + ) + + return PnLSnapshot( + account_id=account_id, + realised_pnl=round(realised, 4), + unrealised_pnl=round(unrealised, 4), + total_pnl=round(realised + unrealised, 4), + trade_count=trade_count, + commission_total=round(commission_total, 4), + ) + + def get_trades( + self, + account_id: str | None = None, + symbol: str | None = None, + strategy_id: str | None = None, + ) -> list[TradeRecord]: + """Retrieve filtered trade records. + + Args: + account_id: Filter by account. + symbol: Filter by symbol. + strategy_id: Filter by strategy. + + Returns: + Matching :class:`TradeRecord` list (most recent first). 
+ """ + results = [ + t for t in self.trades.values() + if (account_id is None or t.account_id == account_id) + and (symbol is None or t.symbol == symbol) + and (strategy_id is None or t.strategy_id == strategy_id) + ] + return sorted(results, key=lambda t: t.executed_at, reverse=True) diff --git a/devsecops/cicd/__init__.py b/devsecops/cicd/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/devsecops/cicd/__pycache__/__init__.cpython-312.pyc b/devsecops/cicd/__pycache__/__init__.cpython-312.pyc new file mode 100644 index 0000000..44442aa Binary files /dev/null and b/devsecops/cicd/__pycache__/__init__.cpython-312.pyc differ diff --git a/devsecops/cicd/__pycache__/build_pipeline.cpython-312.pyc b/devsecops/cicd/__pycache__/build_pipeline.cpython-312.pyc new file mode 100644 index 0000000..f79576f Binary files /dev/null and b/devsecops/cicd/__pycache__/build_pipeline.cpython-312.pyc differ diff --git a/devsecops/cicd/__pycache__/deployment_gates.cpython-312.pyc b/devsecops/cicd/__pycache__/deployment_gates.cpython-312.pyc new file mode 100644 index 0000000..da4cb80 Binary files /dev/null and b/devsecops/cicd/__pycache__/deployment_gates.cpython-312.pyc differ diff --git a/devsecops/cicd/__pycache__/rollback_mechanism.cpython-312.pyc b/devsecops/cicd/__pycache__/rollback_mechanism.cpython-312.pyc new file mode 100644 index 0000000..3c2f2bb Binary files /dev/null and b/devsecops/cicd/__pycache__/rollback_mechanism.cpython-312.pyc differ diff --git a/devsecops/cicd/__pycache__/test_automation.cpython-312.pyc b/devsecops/cicd/__pycache__/test_automation.cpython-312.pyc new file mode 100644 index 0000000..7a7d359 Binary files /dev/null and b/devsecops/cicd/__pycache__/test_automation.cpython-312.pyc differ diff --git a/devsecops/cicd/build_pipeline.py b/devsecops/cicd/build_pipeline.py new file mode 100644 index 0000000..4a028b5 --- /dev/null +++ b/devsecops/cicd/build_pipeline.py @@ -0,0 +1,241 @@ +"""Automated build pipeline orchestration with stages 
and security gates.""" + +from __future__ import annotations + +import asyncio +import time +from dataclasses import dataclass, field +from datetime import datetime, timezone +from enum import Enum, auto +from typing import Any, Callable, Awaitable + +from loguru import logger + + +class StageStatus(Enum): + """Status of a pipeline stage.""" + + PENDING = auto() + RUNNING = auto() + PASSED = auto() + FAILED = auto() + SKIPPED = auto() + + +@dataclass +class PipelineStage: + """A single build pipeline stage. + + Attributes: + name: Stage name. + handler: Async callable that executes the stage. + required: If ``True``, failure blocks subsequent stages. + timeout_s: Maximum execution time in seconds. + """ + + name: str + handler: Callable[[dict[str, Any]], Awaitable[dict[str, Any]]] + required: bool = True + timeout_s: float = 300.0 + + +@dataclass +class StageResult: + """Result of a single pipeline stage execution. + + Attributes: + stage_name: Name of the executed stage. + status: Execution outcome. + output: Stage output data. + duration_ms: Execution time. + error: Error message if failed. + started_at: UTC start timestamp. + """ + + stage_name: str + status: StageStatus + output: dict[str, Any] = field(default_factory=dict) + duration_ms: float = 0.0 + error: str = "" + started_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + + +@dataclass +class BuildResult: + """Aggregated result of a full build pipeline run. + + Attributes: + build_id: Unique build identifier. + pipeline_name: Name of the pipeline. + overall_status: Aggregate pass/fail status. + stage_results: Ordered stage results. + total_duration_ms: Total pipeline duration. + completed_at: UTC completion timestamp. 
+ """ + + build_id: str + pipeline_name: str + overall_status: StageStatus + stage_results: list[StageResult] + total_duration_ms: float + completed_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + + +class BuildPipeline: + """Automated build orchestration with ordered stages and security gates. + + Stages are executed sequentially; a required stage failure halts + subsequent stages. + + Attributes: + stages: Ordered list of pipeline stages. + build_history: Log of completed build results. + """ + + def __init__(self, name: str = "trading-platform") -> None: + """Initialise the build pipeline. + + Args: + name: Pipeline name for identification. + """ + self.name = name + self.stages: list[PipelineStage] = [] + self.build_history: list[BuildResult] = [] + self._build_counter = 0 + logger.info("BuildPipeline '{}' initialised", name) + + def add_stage( + self, + name: str, + handler: Callable[[dict[str, Any]], Awaitable[dict[str, Any]]], + required: bool = True, + timeout_s: float = 300.0, + ) -> None: + """Add a stage to the pipeline. + + Args: + name: Stage name. + handler: Async callable receiving context dict, returning result dict. + required: Whether failure should halt the pipeline. + timeout_s: Stage execution timeout. + """ + self.stages.append(PipelineStage(name=name, handler=handler, required=required, timeout_s=timeout_s)) + logger.debug("Stage '{}' added to pipeline '{}'", name, self.name) + + async def run(self, context: dict[str, Any] | None = None) -> BuildResult: + """Execute the pipeline. + + Args: + context: Initial context data passed to all stages. + + Returns: + :class:`BuildResult` with all stage outcomes. 
+ """ + self._build_counter += 1 + build_id = f"build_{self._build_counter:06d}" + context = dict(context or {}) + pipeline_start = time.monotonic() + stage_results: list[StageResult] = [] + overall_status = StageStatus.PASSED + halted = False + + logger.info("Build {} starting: '{}' ({} stages)", build_id, self.name, len(self.stages)) + + for stage in self.stages: + if halted: + stage_results.append(StageResult( + stage_name=stage.name, + status=StageStatus.SKIPPED, + )) + continue + + result = await self._execute_stage(stage, context) + stage_results.append(result) + context.update(result.output) + + if result.status == StageStatus.FAILED: + if stage.required: + overall_status = StageStatus.FAILED + halted = True + logger.error("Required stage '{}' failed — pipeline halted", stage.name) + + total_ms = (time.monotonic() - pipeline_start) * 1000 + build = BuildResult( + build_id=build_id, + pipeline_name=self.name, + overall_status=overall_status, + stage_results=stage_results, + total_duration_ms=round(total_ms, 2), + ) + self.build_history.append(build) + log = logger.info if overall_status == StageStatus.PASSED else logger.error + log("Build {} {}: {} stages, {:.0f}ms", build_id, overall_status.name, len(stage_results), total_ms) + return build + + async def _execute_stage( + self, + stage: PipelineStage, + context: dict[str, Any], + ) -> StageResult: + """Execute a single pipeline stage with timeout handling. + + Args: + stage: Stage specification. + context: Current pipeline context. + + Returns: + :class:`StageResult`. 
+ """ + start = time.monotonic() + started_at = datetime.now(timezone.utc) + logger.info("Stage '{}' starting", stage.name) + + try: + output = await asyncio.wait_for(stage.handler(context), timeout=stage.timeout_s) + duration_ms = (time.monotonic() - start) * 1000 + return StageResult( + stage_name=stage.name, + status=StageStatus.PASSED, + output=output or {}, + duration_ms=round(duration_ms, 2), + started_at=started_at, + ) + except asyncio.TimeoutError: + duration_ms = (time.monotonic() - start) * 1000 + logger.error("Stage '{}' timed out after {}s", stage.name, stage.timeout_s) + return StageResult( + stage_name=stage.name, + status=StageStatus.FAILED, + duration_ms=round(duration_ms, 2), + error=f"Timeout after {stage.timeout_s}s", + started_at=started_at, + ) + except Exception as exc: + duration_ms = (time.monotonic() - start) * 1000 + logger.error("Stage '{}' failed: {}", stage.name, exc) + return StageResult( + stage_name=stage.name, + status=StageStatus.FAILED, + duration_ms=round(duration_ms, 2), + error=str(exc), + started_at=started_at, + ) + + @staticmethod + def make_simulated_stage(name: str, should_fail: bool = False) -> Callable: + """Factory for a simulated stage handler. + + Args: + name: Stage name for labelling. + should_fail: Whether to simulate a failure. + + Returns: + Async stage handler callable. 
+ """ + async def _handler(context: dict[str, Any]) -> dict[str, Any]: + await asyncio.sleep(0) + if should_fail: + raise RuntimeError(f"Simulated failure in stage '{name}'") + return {f"{name}_passed": True} + + return _handler diff --git a/devsecops/cicd/deployment_gates.py b/devsecops/cicd/deployment_gates.py new file mode 100644 index 0000000..45105c8 --- /dev/null +++ b/devsecops/cicd/deployment_gates.py @@ -0,0 +1,204 @@ +"""Security deployment gates: checkpoints before production deployment.""" + +from __future__ import annotations + +import asyncio +from dataclasses import dataclass, field +from datetime import datetime, timezone +from enum import Enum, auto +from typing import Any, Callable, Awaitable + +from loguru import logger + + +class GateStatus(Enum): + """Status of a deployment gate evaluation.""" + + OPEN = auto() # Gate passed + BLOCKED = auto() # Gate failed + SKIPPED = auto() # Gate not applicable + ERROR = auto() # Gate evaluation error + + +@dataclass +class GateResult: + """Result of a single deployment gate evaluation. + + Attributes: + gate_name: Name of the gate. + status: Evaluation outcome. + message: Human-readable result description. + details: Supplementary data. + evaluated_at: UTC timestamp. + """ + + gate_name: str + status: GateStatus + message: str + details: dict[str, Any] = field(default_factory=dict) + evaluated_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + + +@dataclass +class DeploymentDecision: + """Final deployment go/no-go decision. + + Attributes: + deployment_id: Identifier of the deployment being evaluated. + approved: Whether deployment is approved. + gate_results: Results for all evaluated gates. + blocking_gates: Names of gates that blocked deployment. + evaluated_at: UTC timestamp. 
+ """ + + deployment_id: str + approved: bool + gate_results: list[GateResult] + blocking_gates: list[str] + evaluated_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + + +class DeploymentGates: + """Security checkpoints evaluated before production deployment. + + Gates are composed async functions that inspect a deployment context + and return pass/fail decisions. All required gates must pass for + a deployment to be approved. + + Attributes: + gates: Registered gate functions. + evaluation_history: All past deployment decisions. + """ + + def __init__(self) -> None: + """Initialise the deployment gates with built-in checks.""" + self.gates: dict[str, Callable[[dict[str, Any]], Awaitable[GateResult]]] = {} + self.evaluation_history: list[DeploymentDecision] = [] + self._register_default_gates() + logger.info("DeploymentGates initialised ({} default gates)", len(self.gates)) + + def register_gate( + self, + name: str, + gate_fn: Callable[[dict[str, Any]], Awaitable[GateResult]], + ) -> None: + """Register a custom deployment gate. + + Args: + name: Unique gate name. + gate_fn: Async callable ``(context) → GateResult``. + """ + self.gates[name] = gate_fn + logger.debug("Deployment gate '{}' registered", name) + + async def evaluate( + self, + deployment_id: str, + context: dict[str, Any], + gate_names: list[str] | None = None, + ) -> DeploymentDecision: + """Evaluate all (or specified) gates for a deployment. + + Args: + deployment_id: Deployment identifier. + context: Deployment context (build results, scan results, etc.). + gate_names: Subset of gate names to evaluate; all if None. + + Returns: + :class:`DeploymentDecision` with go/no-go verdict. 
+ """ + targets = gate_names or list(self.gates.keys()) + results: list[GateResult] = [] + + for gate_name in targets: + gate_fn = self.gates.get(gate_name) + if gate_fn is None: + results.append(GateResult( + gate_name=gate_name, + status=GateStatus.ERROR, + message=f"Gate '{gate_name}' not registered", + )) + continue + try: + result = await gate_fn(context) + except Exception as exc: + logger.error("Gate '{}' evaluation error: {}", gate_name, exc) + result = GateResult( + gate_name=gate_name, + status=GateStatus.ERROR, + message=str(exc), + ) + results.append(result) + + blocking = [ + r.gate_name for r in results + if r.status in (GateStatus.BLOCKED, GateStatus.ERROR) + ] + approved = len(blocking) == 0 + + decision = DeploymentDecision( + deployment_id=deployment_id, + approved=approved, + gate_results=results, + blocking_gates=blocking, + ) + self.evaluation_history.append(decision) + log = logger.info if approved else logger.error + log( + "Deployment '{}': {} ({} gates, {} blocking)", + deployment_id, + "APPROVED" if approved else "BLOCKED", + len(results), + len(blocking), + ) + return decision + + def _register_default_gates(self) -> None: + """Register built-in security gates.""" + + async def no_critical_vulns(ctx: dict[str, Any]) -> GateResult: + critical = ctx.get("critical_vulnerabilities", 0) + passed = critical == 0 + return GateResult( + gate_name="no_critical_vulnerabilities", + status=GateStatus.OPEN if passed else GateStatus.BLOCKED, + message=f"Critical vulnerabilities: {critical}", + details={"critical_count": critical}, + ) + + async def sast_passed(ctx: dict[str, Any]) -> GateResult: + passed = ctx.get("sast_passed", True) + return GateResult( + gate_name="sast_passed", + status=GateStatus.OPEN if passed else GateStatus.BLOCKED, + message="SAST scan passed" if passed else "SAST scan failed", + ) + + async def tests_passed(ctx: dict[str, Any]) -> GateResult: + coverage = ctx.get("test_coverage_pct", 100.0) + min_coverage = 
ctx.get("min_coverage_pct", 80.0) + passed = coverage >= min_coverage + return GateResult( + gate_name="test_coverage", + status=GateStatus.OPEN if passed else GateStatus.BLOCKED, + message=f"Coverage {coverage:.1f}% {'≥' if passed else '<'} {min_coverage:.1f}%", + details={"coverage_pct": coverage, "min_pct": min_coverage}, + ) + + async def secrets_not_leaked(ctx: dict[str, Any]) -> GateResult: + secrets_found = ctx.get("secrets_detected", 0) + passed = secrets_found == 0 + return GateResult( + gate_name="no_secrets_leaked", + status=GateStatus.OPEN if passed else GateStatus.BLOCKED, + message=f"Secrets detected: {secrets_found}", + details={"secrets_count": secrets_found}, + ) + + for name, fn in [ + ("no_critical_vulnerabilities", no_critical_vulns), + ("sast_passed", sast_passed), + ("test_coverage", tests_passed), + ("no_secrets_leaked", secrets_not_leaked), + ]: + self.gates[name] = fn diff --git a/devsecops/cicd/rollback_mechanism.py b/devsecops/cicd/rollback_mechanism.py new file mode 100644 index 0000000..ddc3054 --- /dev/null +++ b/devsecops/cicd/rollback_mechanism.py @@ -0,0 +1,275 @@ +"""Safe rollback mechanism with health checks for trading platform deployments.""" + +from __future__ import annotations + +import asyncio +import time +from dataclasses import dataclass, field +from datetime import datetime, timezone +from enum import Enum, auto +from typing import Any, Callable, Awaitable + +from loguru import logger + + +class RollbackStatus(Enum): + """Status of a rollback operation.""" + + SUCCESS = auto() + FAILED = auto() + PARTIAL = auto() + IN_PROGRESS = auto() + + +@dataclass +class DeploymentSnapshot: + """Snapshot of a deployment that can be rolled back to. + + Attributes: + snapshot_id: Unique identifier. + service_name: Service this snapshot belongs to. + version: Deployment version string. + config: Service configuration at the time of snapshot. + health_check_url: URL for health verification. + created_at: UTC creation timestamp. 
+ """ + + snapshot_id: str + service_name: str + version: str + config: dict[str, Any] + health_check_url: str = "" + created_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + + +@dataclass +class RollbackResult: + """Result of a rollback operation. + + Attributes: + rollback_id: Unique identifier. + service_name: Service that was rolled back. + from_version: Version rolled back from. + to_version: Version rolled back to. + status: Rollback outcome. + health_verified: Whether health check passed post-rollback. + steps_completed: Number of rollback steps completed. + error: Error message if failed. + duration_ms: Total operation duration. + completed_at: UTC timestamp. + """ + + rollback_id: str + service_name: str + from_version: str + to_version: str + status: RollbackStatus + health_verified: bool + steps_completed: int + error: str = "" + duration_ms: float = 0.0 + completed_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + + +class RollbackMechanism: + """Safe rollback with health checks for trading platform deployments. + + Manages deployment snapshots and orchestrates rollback procedures + with mandatory health verification at each step. + + Attributes: + snapshots: Deployment snapshots keyed by snapshot_id. + rollback_history: All completed rollback results. + _health_checker: Optional async health check callable. + """ + + def __init__( + self, + health_checker: Callable[[str], Awaitable[bool]] | None = None, + ) -> None: + """Initialise the rollback mechanism. + + Args: + health_checker: Async callable ``(url) → bool`` for health + verification. Uses a simulated checker when ``None``. 
+ """ + self.snapshots: dict[str, DeploymentSnapshot] = {} + self.rollback_history: list[RollbackResult] = [] + self._health_checker = health_checker or self._default_health_check + self._rollback_counter = 0 + logger.info("RollbackMechanism initialised") + + def capture_snapshot( + self, + service_name: str, + version: str, + config: dict[str, Any], + health_check_url: str = "", + ) -> DeploymentSnapshot: + """Capture a deployment snapshot for future rollback. + + Args: + service_name: Service identifier. + version: Current deployment version. + config: Current service configuration. + health_check_url: Health check endpoint URL. + + Returns: + The created :class:`DeploymentSnapshot`. + """ + snapshot_id = f"snap_{service_name}_{version}_{int(time.time())}" + snapshot = DeploymentSnapshot( + snapshot_id=snapshot_id, + service_name=service_name, + version=version, + config=dict(config), + health_check_url=health_check_url, + ) + self.snapshots[snapshot_id] = snapshot + logger.info("Snapshot captured: {} v{} (id={})", service_name, version, snapshot_id) + return snapshot + + def get_latest_snapshot(self, service_name: str) -> DeploymentSnapshot | None: + """Get the most recent snapshot for a service. + + Args: + service_name: Service identifier. + + Returns: + Most recent :class:`DeploymentSnapshot` or ``None``. + """ + service_snaps = [ + s for s in self.snapshots.values() + if s.service_name == service_name + ] + if not service_snaps: + return None + return max(service_snaps, key=lambda s: s.created_at) + + async def rollback( + self, + service_name: str, + current_version: str, + target_snapshot_id: str | None = None, + max_health_retries: int = 3, + ) -> RollbackResult: + """Execute a rollback for a service. + + Args: + service_name: Service to roll back. + current_version: Currently deployed version. + target_snapshot_id: Snapshot to roll back to; uses the most + recent snapshot if ``None``. + max_health_retries: Health check retry count after rollback. 
+ + Returns: + :class:`RollbackResult` with outcome. + + Raises: + RuntimeError: If no snapshot is available for the service. + """ + self._rollback_counter += 1 + rollback_id = f"rollback_{self._rollback_counter:06d}" + start = time.monotonic() + + if target_snapshot_id: + snapshot = self.snapshots.get(target_snapshot_id) + else: + snapshot = self.get_latest_snapshot(service_name) + + if snapshot is None: + raise RuntimeError( + f"No snapshot available for service '{service_name}'. " + "Capture a snapshot before attempting rollback." + ) + + logger.warning( + "Rollback {}: '{}' {} → {}", + rollback_id, + service_name, + current_version, + snapshot.version, + ) + + steps = 0 + try: + # Step 1: Stop traffic to the current version + await self._stop_traffic(service_name, current_version) + steps += 1 + + # Step 2: Deploy the previous version + await self._deploy_version(service_name, snapshot) + steps += 1 + + # Step 3: Verify health + health_ok = False + for attempt in range(1, max_health_retries + 1): + health_ok = await self._health_checker(snapshot.health_check_url) + if health_ok: + logger.info("Health check passed after rollback (attempt {})", attempt) + break + logger.warning("Health check attempt {}/{} failed", attempt, max_health_retries) + await asyncio.sleep(0) + + steps += 1 + status = RollbackStatus.SUCCESS if health_ok else RollbackStatus.PARTIAL + + except Exception as exc: + logger.error("Rollback {} failed at step {}: {}", rollback_id, steps + 1, exc) + status = RollbackStatus.FAILED + health_ok = False + + duration_ms = (time.monotonic() - start) * 1000 + result = RollbackResult( + rollback_id=rollback_id, + service_name=service_name, + from_version=current_version, + to_version=snapshot.version, + status=status, + health_verified=health_ok, + steps_completed=steps, + duration_ms=round(duration_ms, 2), + ) + self.rollback_history.append(result) + log = logger.info if status == RollbackStatus.SUCCESS else logger.error + log( + "Rollback {} {}: {} → 
{} (health={})", + rollback_id, + status.name, + current_version, + snapshot.version, + health_ok, + ) + return result + + async def _stop_traffic(self, service_name: str, version: str) -> None: + """Simulate stopping traffic to a service version. + + Args: + service_name: Service identifier. + version: Version to stop. + """ + await asyncio.sleep(0) + logger.debug("Traffic stopped for '{}' v{}", service_name, version) + + async def _deploy_version(self, service_name: str, snapshot: DeploymentSnapshot) -> None: + """Simulate deploying a snapshot version. + + Args: + service_name: Service identifier. + snapshot: Snapshot to restore. + """ + await asyncio.sleep(0) + logger.debug("Deploying '{}' v{} from snapshot {}", service_name, snapshot.version, snapshot.snapshot_id) + + async def _default_health_check(self, url: str) -> bool: + """Simulated health check. + + Args: + url: Health check URL (unused in simulation). + + Returns: + Always ``True`` in simulation. + """ + await asyncio.sleep(0) + return True diff --git a/devsecops/cicd/test_automation.py b/devsecops/cicd/test_automation.py new file mode 100644 index 0000000..4dcc141 --- /dev/null +++ b/devsecops/cicd/test_automation.py @@ -0,0 +1,244 @@ +"""Security testing automation runner for CI/CD pipelines.""" + +from __future__ import annotations + +import asyncio +from dataclasses import dataclass, field +from datetime import datetime, timezone +from enum import Enum, auto +from typing import Any + +from loguru import logger + + +class TestType(Enum): + """Categories of security tests.""" + + SAST = auto() + DAST = auto() + DEPENDENCY_SCAN = auto() + CONTAINER_SCAN = auto() + SECRETS_SCAN = auto() + COMPLIANCE = auto() + PENETRATION = auto() + + +@dataclass +class SecurityTestResult: + """Result of a single security test run. + + Attributes: + test_id: Unique identifier. + test_type: Category of test. + test_name: Human-readable name. + passed: Whether the test passed. 
+ findings_count: Number of security findings. + critical_findings: Number of critical findings. + details: Supplementary result data. + duration_ms: Test execution time. + executed_at: UTC timestamp. + """ + + test_id: str + test_type: TestType + test_name: str + passed: bool + findings_count: int + critical_findings: int + details: dict[str, Any] = field(default_factory=dict) + duration_ms: float = 0.0 + executed_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + + +@dataclass +class TestSuiteResult: + """Aggregated result of a security test suite run. + + Attributes: + suite_id: Unique identifier. + results: Individual test results. + passed_count: Tests that passed. + failed_count: Tests that failed. + total_critical_findings: Total critical findings across all tests. + overall_passed: Whether the suite passed. + duration_ms: Total suite duration. + """ + + suite_id: str + results: list[SecurityTestResult] + passed_count: int + failed_count: int + total_critical_findings: int + overall_passed: bool + duration_ms: float + + +class TestAutomation: + """Security testing automation runner for CI/CD integration. + + Orchestrates a suite of security tests and aggregates results + for use in deployment gate evaluations. + + Attributes: + test_history: All completed suite results. + _registered_tests: Registered test functions. + """ + + def __init__(self) -> None: + """Initialise the test automation runner.""" + self.test_history: list[TestSuiteResult] = [] + self._registered_tests: list[tuple[TestType, str, Any]] = [] + self._suite_counter = 0 + logger.info("TestAutomation runner initialised") + + def register_test( + self, + test_type: TestType, + name: str, + test_fn: Any, + ) -> None: + """Register a security test function. + + Args: + test_type: Category of test. + name: Human-readable test name. + test_fn: Async callable ``(context) → SecurityTestResult``. 
+ """ + self._registered_tests.append((test_type, name, test_fn)) + logger.debug("Security test '{}' ({}) registered", name, test_type.name) + + async def run_suite( + self, + context: dict[str, Any] | None = None, + test_types: list[TestType] | None = None, + ) -> TestSuiteResult: + """Execute all registered (or filtered) security tests. + + Args: + context: Context data passed to each test. + test_types: If provided, only tests of these types are run. + + Returns: + :class:`TestSuiteResult` aggregating all results. + """ + import time + self._suite_counter += 1 + suite_id = f"suite_{self._suite_counter:06d}" + context = context or {} + start = time.monotonic() + + tests_to_run = [ + (tt, name, fn) + for tt, name, fn in self._registered_tests + if test_types is None or tt in test_types + ] + + if not tests_to_run: + # Run built-in simulated tests + tests_to_run = self._default_tests() + + logger.info("Running security test suite {}: {} tests", suite_id, len(tests_to_run)) + results: list[SecurityTestResult] = [] + + for test_type, name, test_fn in tests_to_run: + result = await self._run_test(test_type, name, test_fn, context) + results.append(result) + + passed = sum(1 for r in results if r.passed) + failed = sum(1 for r in results if not r.passed) + critical = sum(r.critical_findings for r in results) + duration_ms = (time.monotonic() - start) * 1000 + + suite = TestSuiteResult( + suite_id=suite_id, + results=results, + passed_count=passed, + failed_count=failed, + total_critical_findings=critical, + overall_passed=critical == 0, + duration_ms=round(duration_ms, 2), + ) + self.test_history.append(suite) + log = logger.info if suite.overall_passed else logger.error + log( + "Suite {}: {}/{} passed, {} critical findings", + suite_id, + passed, + len(results), + critical, + ) + return suite + + async def _run_test( + self, + test_type: TestType, + name: str, + test_fn: Any, + context: dict[str, Any], + ) -> SecurityTestResult: + """Execute a single test with 
timing. + + Args: + test_type: Test category. + name: Test name. + test_fn: Async callable. + context: Test context. + + Returns: + :class:`SecurityTestResult`. + """ + import time + test_id = f"test_{hash(name) % 100000:05d}" + start = time.monotonic() + + try: + result: SecurityTestResult = await test_fn(context) + result.duration_ms = round((time.monotonic() - start) * 1000, 2) + return result + except Exception as exc: + logger.error("Test '{}' raised: {}", name, exc) + return SecurityTestResult( + test_id=test_id, + test_type=test_type, + test_name=name, + passed=False, + findings_count=0, + critical_findings=1, + details={"error": str(exc)}, + duration_ms=round((time.monotonic() - start) * 1000, 2), + ) + + def _default_tests(self) -> list[tuple[TestType, str, Any]]: + """Return a set of built-in simulated security tests. + + Returns: + List of ``(TestType, name, handler)`` tuples. + """ + async def sast_test(ctx: dict[str, Any]) -> SecurityTestResult: + await asyncio.sleep(0) + return SecurityTestResult( + test_id="sast_001", + test_type=TestType.SAST, + test_name="SAST Scan (simulated)", + passed=True, + findings_count=2, + critical_findings=0, + details={"tool": "simulated"}, + ) + + async def dep_test(ctx: dict[str, Any]) -> SecurityTestResult: + await asyncio.sleep(0) + return SecurityTestResult( + test_id="dep_001", + test_type=TestType.DEPENDENCY_SCAN, + test_name="Dependency Scan (simulated)", + passed=True, + findings_count=1, + critical_findings=0, + details={"tool": "simulated"}, + ) + + return [ + (TestType.SAST, "SAST Scan", sast_test), + (TestType.DEPENDENCY_SCAN, "Dependency Scan", dep_test), + ] diff --git a/devsecops/scanning/__init__.py b/devsecops/scanning/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/devsecops/scanning/__pycache__/__init__.cpython-312.pyc b/devsecops/scanning/__pycache__/__init__.cpython-312.pyc new file mode 100644 index 0000000..19d17e5 Binary files /dev/null and 
b/devsecops/scanning/__pycache__/__init__.cpython-312.pyc differ diff --git a/devsecops/scanning/__pycache__/api_scanner.cpython-312.pyc b/devsecops/scanning/__pycache__/api_scanner.cpython-312.pyc new file mode 100644 index 0000000..ca6a2e5 Binary files /dev/null and b/devsecops/scanning/__pycache__/api_scanner.cpython-312.pyc differ diff --git a/devsecops/scanning/__pycache__/code_scanner.cpython-312.pyc b/devsecops/scanning/__pycache__/code_scanner.cpython-312.pyc new file mode 100644 index 0000000..59e5dab Binary files /dev/null and b/devsecops/scanning/__pycache__/code_scanner.cpython-312.pyc differ diff --git a/devsecops/scanning/__pycache__/container_scanner.cpython-312.pyc b/devsecops/scanning/__pycache__/container_scanner.cpython-312.pyc new file mode 100644 index 0000000..0abb58a Binary files /dev/null and b/devsecops/scanning/__pycache__/container_scanner.cpython-312.pyc differ diff --git a/devsecops/scanning/__pycache__/dependency_scanner.cpython-312.pyc b/devsecops/scanning/__pycache__/dependency_scanner.cpython-312.pyc new file mode 100644 index 0000000..615e382 Binary files /dev/null and b/devsecops/scanning/__pycache__/dependency_scanner.cpython-312.pyc differ diff --git a/devsecops/scanning/api_scanner.py b/devsecops/scanning/api_scanner.py new file mode 100644 index 0000000..2effa25 --- /dev/null +++ b/devsecops/scanning/api_scanner.py @@ -0,0 +1,342 @@ +"""API security testing: authentication checks, injection detection, and rate limiting.""" + +from __future__ import annotations + +import asyncio +import re +from dataclasses import dataclass, field +from datetime import datetime, timezone +from typing import Any + +from loguru import logger + + +@dataclass +class APITestResult: + """Result of a single API security test. + + Attributes: + test_id: Unique test identifier. + test_name: Human-readable test name. + endpoint: Tested API endpoint. + passed: Whether the test passed. + risk_level: ``"low"``, ``"medium"``, ``"high"``, or ``"critical"``. 
+ finding: Description of any issue found. + evidence: Supplementary evidence. + tested_at: UTC timestamp. + """ + + test_id: str + test_name: str + endpoint: str + passed: bool + risk_level: str + finding: str = "" + evidence: dict[str, Any] = field(default_factory=dict) + tested_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + + +@dataclass +class APIScanReport: + """Aggregate API security scan report. + + Attributes: + scan_id: Unique scan identifier. + base_url: Base URL scanned. + results: Individual test results. + passed_count: Number of passed tests. + failed_count: Number of failed tests. + critical_count: Number of critical findings. + scanned_at: UTC timestamp. + """ + + scan_id: str + base_url: str + results: list[APITestResult] + passed_count: int + failed_count: int + critical_count: int + scanned_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + + @property + def overall_passed(self) -> bool: + """Whether the scan passed (no critical findings).""" + return self.critical_count == 0 + + +# SQL injection payloads for black-box probing +_SQLI_PAYLOADS: list[str] = [ + "' OR '1'='1", + "'; DROP TABLE users; --", + "1 UNION SELECT NULL,NULL--", + "' AND 1=1--", +] + +# Headers checked for authentication enforcement +_AUTH_HEADERS: list[str] = ["Authorization", "X-API-Key", "Bearer"] + +# Patterns indicating injection vulnerabilities in response +_ERROR_PATTERNS: list[re.Pattern[str]] = [ + re.compile(r"sql syntax", re.IGNORECASE), + re.compile(r"ORA-\d{5}", re.IGNORECASE), + re.compile(r"mysql_fetch", re.IGNORECASE), + re.compile(r"stack trace", re.IGNORECASE), + re.compile(r"exception in thread", re.IGNORECASE), +] + + +class APIScanner: + """API security testing for auth, injection, and rate limiting. + + Performs passive analysis of API specifications and simulated + active testing against provided endpoints. + + Attributes: + scan_history: All completed scan reports. 
+ """ + + def __init__(self) -> None: + """Initialise the API scanner.""" + self.scan_history: list[APIScanReport] = [] + logger.info("APIScanner initialised") + + async def scan( + self, + base_url: str, + endpoints: list[dict[str, Any]], + api_spec: dict[str, Any] | None = None, + ) -> APIScanReport: + """Run a suite of API security tests. + + Args: + base_url: Base URL of the API under test. + endpoints: List of endpoint dicts with ``"path"``, ``"method"``, + and optional ``"auth_required"`` keys. + api_spec: Optional OpenAPI spec dict for passive analysis. + + Returns: + :class:`APIScanReport` with all test results. + """ + import time + scan_id = f"api_scan_{int(time.time()*1000)}" + results: list[APITestResult] = [] + + test_coroutines = [] + for ep in endpoints: + path = ep.get("path", "/") + method = ep.get("method", "GET") + auth_required = ep.get("auth_required", True) + + test_coroutines.extend([ + self._test_auth(scan_id, base_url, path, method, auth_required), + self._test_injection(scan_id, base_url, path, method), + self._test_rate_limiting(scan_id, base_url, path), + ]) + + if api_spec: + passive = self._passive_spec_analysis(scan_id, base_url, api_spec) + results.extend(passive) + + active_results = await asyncio.gather(*test_coroutines) + results.extend(active_results) + + passed = sum(1 for r in results if r.passed) + failed = sum(1 for r in results if not r.passed) + critical = sum(1 for r in results if not r.passed and r.risk_level == "critical") + + report = APIScanReport( + scan_id=scan_id, + base_url=base_url, + results=results, + passed_count=passed, + failed_count=failed, + critical_count=critical, + ) + self.scan_history.append(report) + logger.info( + "API scan '{}': {}/{} passed, {} critical", + base_url, + passed, + len(results), + critical, + ) + return report + + async def _test_auth( + self, + scan_id: str, + base_url: str, + path: str, + method: str, + auth_required: bool, + ) -> APITestResult: + """Test whether an endpoint 
enforces authentication. + + Args: + scan_id: Parent scan identifier. + base_url: API base URL. + path: Endpoint path. + method: HTTP method. + auth_required: Whether auth should be enforced. + + Returns: + :class:`APITestResult`. + """ + await asyncio.sleep(0) + # Simulate: check whether the endpoint is marked as requiring auth + # In a real implementation, send unauthenticated requests and check 401 + endpoint = f"{base_url}{path}" + passed = True # Conservative: assume auth is enforced unless tested otherwise + finding = "" + risk_level = "low" + + if auth_required: + # Simulate checking for auth enforcement + # Real check: HTTP request without auth header → expect 401/403 + passing = True # Would be set based on actual HTTP response + if not passing: + passed = False + finding = f"Endpoint {method} {path} does not enforce authentication" + risk_level = "critical" + + return APITestResult( + test_id=f"{scan_id}_auth_{path.replace('/', '_')}", + test_name="Authentication Enforcement", + endpoint=endpoint, + passed=passed, + risk_level=risk_level, + finding=finding, + evidence={"method": method, "auth_required": auth_required}, + ) + + async def _test_injection( + self, + scan_id: str, + base_url: str, + path: str, + method: str, + ) -> APITestResult: + """Test for injection vulnerabilities in endpoint parameters. + + Args: + scan_id: Parent scan identifier. + base_url: API base URL. + path: Endpoint path. + method: HTTP method. + + Returns: + :class:`APITestResult`. 
+ """ + await asyncio.sleep(0) + endpoint = f"{base_url}{path}" + + # Passive: check path parameters for injection vectors + path_injection_patterns = [ + re.compile(r"\{[^}]+\}", re.IGNORECASE), # Path params + ] + has_params = any(p.search(path) for p in path_injection_patterns) + + passed = True + finding = "" + risk_level = "low" + + if has_params and "{" in path: + # Flag parameterised endpoints for manual verification + finding = f"Parameterised endpoint {path} should be tested for injection" + risk_level = "medium" + passed = True # Warning, not failure + elif any(payload.lower() in path.lower() for payload in _SQLI_PAYLOADS): + passed = False + finding = "Injection payload detected in endpoint path" + risk_level = "critical" + + return APITestResult( + test_id=f"{scan_id}_injection_{path.replace('/', '_')}", + test_name="Injection Detection", + endpoint=endpoint, + passed=passed, + risk_level=risk_level, + finding=finding, + ) + + async def _test_rate_limiting( + self, + scan_id: str, + base_url: str, + path: str, + ) -> APITestResult: + """Verify that rate limiting headers are present. + + Args: + scan_id: Parent scan identifier. + base_url: API base URL. + path: Endpoint path. + + Returns: + :class:`APITestResult`. + """ + await asyncio.sleep(0) + endpoint = f"{base_url}{path}" + + # Simulate: assume rate limiting present for authenticated endpoints + # Real check: send multiple rapid requests and inspect headers + passed = True + finding = "" + risk_level = "low" + + return APITestResult( + test_id=f"{scan_id}_ratelimit_{path.replace('/', '_')}", + test_name="Rate Limiting Verification", + endpoint=endpoint, + passed=passed, + risk_level=risk_level, + finding=finding, + evidence={"simulated": True, "note": "Requires live HTTP testing for full verification"}, + ) + + def _passive_spec_analysis( + self, + scan_id: str, + base_url: str, + api_spec: dict[str, Any], + ) -> list[APITestResult]: + """Perform passive analysis of an OpenAPI specification. 
+ + Args: + scan_id: Scan identifier. + base_url: Base URL. + api_spec: OpenAPI specification dictionary. + + Returns: + List of :class:`APITestResult` from passive analysis. + """ + results: list[APITestResult] = [] + + # Check for global security definitions + has_security_schemes = bool( + api_spec.get("components", {}).get("securitySchemes") + or api_spec.get("securityDefinitions") + ) + + results.append(APITestResult( + test_id=f"{scan_id}_spec_auth", + test_name="OpenAPI Security Schemes", + endpoint=base_url, + passed=has_security_schemes, + risk_level="high" if not has_security_schemes else "low", + finding="" if has_security_schemes else "No security schemes defined in API spec", + )) + + # Check API version + info = api_spec.get("info", {}) + has_version = bool(info.get("version")) + results.append(APITestResult( + test_id=f"{scan_id}_spec_version", + test_name="API Version Defined", + endpoint=base_url, + passed=has_version, + risk_level="low", + finding="" if has_version else "API version not specified in spec", + )) + + return results diff --git a/devsecops/scanning/code_scanner.py b/devsecops/scanning/code_scanner.py new file mode 100644 index 0000000..5379217 --- /dev/null +++ b/devsecops/scanning/code_scanner.py @@ -0,0 +1,267 @@ +"""Static application security testing (SAST) wrapper using bandit.""" + +from __future__ import annotations + +import subprocess +import json +from dataclasses import dataclass, field +from datetime import datetime, timezone +from typing import Any + +from loguru import logger + + +@dataclass +class CodeIssue: + """A security issue detected by static analysis. + + Attributes: + issue_id: Unique identifier. + severity: Severity level (``"LOW"``, ``"MEDIUM"``, ``"HIGH"``). + confidence: Detection confidence (``"LOW"``, ``"MEDIUM"``, ``"HIGH"``). + issue_type: Issue category (e.g. ``"B601"``, ``"hardcoded_password"``). + description: Human-readable description. + file_path: Source file containing the issue. 
@dataclass
class CodeIssue:
    """A security issue detected by static analysis.

    Attributes:
        issue_id: Unique identifier.
        severity: Severity level (``"LOW"``, ``"MEDIUM"``, ``"HIGH"``).
        confidence: Detection confidence (``"LOW"``, ``"MEDIUM"``, ``"HIGH"``).
        issue_type: Issue category (e.g. ``"B601"``, ``"hardcoded_password"``).
        description: Human-readable description.
        file_path: Source file containing the issue.
        line_number: Line number of the issue.
        code_snippet: Offending code excerpt.
        cwe: Common Weakness Enumeration identifier (e.g. ``"CWE-89"``).
    """

    issue_id: str
    severity: str
    confidence: str
    issue_type: str
    description: str
    file_path: str
    line_number: int
    code_snippet: str = ""
    cwe: str = ""


@dataclass
class ScanResult:
    """Result of a code security scan.

    Attributes:
        scan_id: Unique scan identifier.
        target_path: Path that was scanned.
        issues: Detected security issues.
        high_count: Number of HIGH severity issues.
        medium_count: Number of MEDIUM severity issues.
        low_count: Number of LOW severity issues.
        tool: Scanner tool used.
        scan_duration_ms: Time taken for the scan.
        scanned_at: UTC timestamp.
    """

    scan_id: str
    target_path: str
    issues: list[CodeIssue]
    high_count: int
    medium_count: int
    low_count: int
    tool: str
    scan_duration_ms: float
    scanned_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc))

    @property
    def passed(self) -> bool:
        """Whether the scan passed (no HIGH severity issues)."""
        return self.high_count == 0


class CodeScanner:
    """SAST wrapper that runs bandit if available, with an abstract fallback.

    When bandit is not installed, the scanner returns an abstract result
    indicating that a real scan was not performed.

    Attributes:
        _bandit_available: Whether the bandit binary is accessible.
        scan_history: Log of all scan results.
    """

    def __init__(self) -> None:
        """Initialise the code scanner and probe for bandit availability."""
        self.scan_history: list[ScanResult] = []
        self._bandit_available = self._check_bandit()
        if self._bandit_available:
            logger.info("CodeScanner initialised (bandit available)")
        else:
            logger.warning(
                "CodeScanner initialised — bandit not found. "
                "Install with: pip install bandit"
            )

    def scan(
        self,
        target_path: str,
        severity_level: str = "LOW",
        confidence_level: str = "LOW",
    ) -> ScanResult:
        """Run a static security scan on the target path.

        Uses bandit when available; falls back to an abstract stub result.

        Args:
            target_path: File or directory to scan.
            severity_level: Minimum severity to report (``"LOW"``, ``"MEDIUM"``,
                ``"HIGH"``).
            confidence_level: Minimum confidence to report.

        Returns:
            :class:`ScanResult` with detected issues.
        """
        import time
        start = time.monotonic()
        scan_id = f"scan_{int(time.time()*1000)}"

        if self._bandit_available:
            result = self._run_bandit(target_path, severity_level, confidence_level, scan_id)
        else:
            result = self._abstract_result(target_path, scan_id)

        result.scan_duration_ms = round((time.monotonic() - start) * 1000, 2)
        self.scan_history.append(result)
        logger.info(
            "Code scan '{}': {} issues (H:{}, M:{}, L:{})",
            target_path,
            len(result.issues),
            result.high_count,
            result.medium_count,
            result.low_count,
        )
        return result

    def _run_bandit(
        self,
        target_path: str,
        severity_level: str,
        confidence_level: str,
        scan_id: str,
    ) -> ScanResult:
        """Execute bandit and parse its JSON output.

        Args:
            target_path: Path to scan.
            severity_level: Minimum severity filter.
            confidence_level: Minimum confidence filter.
            scan_id: Scan identifier.

        Returns:
            Parsed :class:`ScanResult`.
        """
        # bandit's -l/-i are *repeatable count* flags (-l LOW, -ll MEDIUM,
        # -lll HIGH); they take no value, so the previous `-l l` form handed
        # bandit a stray positional argument. Map the level to the flag.
        sev_flag = {"LOW": "-l", "MEDIUM": "-ll", "HIGH": "-lll"}.get(
            severity_level.upper(), "-l"
        )
        conf_flag = {"LOW": "-i", "MEDIUM": "-ii", "HIGH": "-iii"}.get(
            confidence_level.upper(), "-i"
        )
        try:
            proc = subprocess.run(
                ["bandit", "-r", target_path, "-f", "json", sev_flag, conf_flag],
                capture_output=True,
                text=True,
                timeout=120,
            )
            data = json.loads(proc.stdout or "{}")
            return self._parse_bandit_output(data, target_path, scan_id)
        except Exception as exc:  # subsumes TimeoutExpired / JSONDecodeError
            logger.error("Bandit execution error: {}", exc)
            return self._abstract_result(target_path, scan_id, error=str(exc))

    def _parse_bandit_output(
        self,
        data: dict[str, Any],
        target_path: str,
        scan_id: str,
    ) -> ScanResult:
        """Parse bandit JSON output into a ScanResult.

        Args:
            data: Bandit JSON output dictionary.
            target_path: Scanned path.
            scan_id: Scan identifier.

        Returns:
            Populated :class:`ScanResult`.
        """
        issues: list[CodeIssue] = []

        for idx, raw in enumerate(data.get("results", [])):
            # bandit reports issue_cwe as {"id": <int>, "link": ...};
            # normalise to the documented "CWE-<n>" string form.
            cwe_info = raw.get("issue_cwe")
            cwe_id = cwe_info.get("id", "") if isinstance(cwe_info, dict) else ""
            issues.append(CodeIssue(
                issue_id=f"{scan_id}_{idx:04d}",
                severity=raw.get("issue_severity", "UNDEFINED").upper(),
                confidence=raw.get("issue_confidence", "UNDEFINED").upper(),
                issue_type=raw.get("test_id", ""),
                description=raw.get("issue_text", ""),
                file_path=raw.get("filename", ""),
                line_number=raw.get("line_number", 0),
                code_snippet=raw.get("code", ""),
                cwe=f"CWE-{cwe_id}" if cwe_id != "" else "",
            ))

        high = sum(1 for issue in issues if issue.severity == "HIGH")
        medium = sum(1 for issue in issues if issue.severity == "MEDIUM")
        low = sum(1 for issue in issues if issue.severity == "LOW")

        return ScanResult(
            scan_id=scan_id,
            target_path=target_path,
            issues=issues,
            high_count=high,
            medium_count=medium,
            low_count=low,
            tool="bandit",
            scan_duration_ms=0.0,
        )

    def _abstract_result(
        self,
        target_path: str,
        scan_id: str,
        error: str = "",
    ) -> ScanResult:
        """Return a stub result when bandit is unavailable.

        Args:
            target_path: Path that would have been scanned.
            scan_id: Scan identifier.
            error: Optional error message.

        Returns:
            Stub :class:`ScanResult` with no issues detected.
        """
        logger.warning("Abstract scan result returned for '{}' (bandit unavailable)", target_path)
        return ScanResult(
            scan_id=scan_id,
            target_path=target_path,
            issues=[],
            high_count=0,
            medium_count=0,
            low_count=0,
            tool="abstract" if not error else "error",
            scan_duration_ms=0.0,
        )

    @staticmethod
    def _check_bandit() -> bool:
        """Probe whether bandit is installed and accessible.

        Returns:
            ``True`` if bandit is available.
        """
        try:
            result = subprocess.run(
                ["bandit", "--version"],
                capture_output=True,
                timeout=5,
            )
            return result.returncode == 0
        except (FileNotFoundError, subprocess.TimeoutExpired):
            return False
+ + Args: + target_path: Path that would have been scanned. + scan_id: Scan identifier. + error: Optional error message. + + Returns: + Stub :class:`ScanResult` with no issues detected. + """ + logger.warning("Abstract scan result returned for '{}' (bandit unavailable)", target_path) + return ScanResult( + scan_id=scan_id, + target_path=target_path, + issues=[], + high_count=0, + medium_count=0, + low_count=0, + tool="abstract" if not error else "error", + scan_duration_ms=0.0, + ) + + @staticmethod + def _check_bandit() -> bool: + """Probe whether bandit is installed and accessible. + + Returns: + ``True`` if bandit is available. + """ + try: + result = subprocess.run( + ["bandit", "--version"], + capture_output=True, + timeout=5, + ) + return result.returncode == 0 + except (FileNotFoundError, subprocess.TimeoutExpired): + return False diff --git a/devsecops/scanning/container_scanner.py b/devsecops/scanning/container_scanner.py new file mode 100644 index 0000000..873a0d7 --- /dev/null +++ b/devsecops/scanning/container_scanner.py @@ -0,0 +1,241 @@ +"""Container image security scanning.""" + +from __future__ import annotations + +import subprocess +from dataclasses import dataclass, field +from datetime import datetime, timezone +from typing import Any + +from loguru import logger + + +@dataclass +class ContainerVulnerability: + """A vulnerability found in a container image layer. + + Attributes: + cve_id: CVE identifier. + package: Affected OS or library package. + installed_version: Installed package version. + fixed_version: Version with the fix (empty if no fix available). + severity: ``"CRITICAL"``, ``"HIGH"``, ``"MEDIUM"``, ``"LOW"``. + layer: Image layer where the package was installed. + description: Brief description. + """ + + cve_id: str + package: str + installed_version: str + fixed_version: str + severity: str + layer: str = "" + description: str = "" + + +@dataclass +class ContainerScanResult: + """Result of a container image security scan. 
+ + Attributes: + scan_id: Unique scan identifier. + image: Image reference that was scanned. + vulnerabilities: All detected vulnerabilities. + critical_count: Number of CRITICAL vulnerabilities. + high_count: Number of HIGH vulnerabilities. + medium_count: Number of MEDIUM vulnerabilities. + low_count: Number of LOW vulnerabilities. + base_image: Detected base image. + tool: Scanner tool used. + scanned_at: UTC timestamp. + """ + + scan_id: str + image: str + vulnerabilities: list[ContainerVulnerability] + critical_count: int + high_count: int + medium_count: int + low_count: int + base_image: str = "" + tool: str = "abstract" + scanned_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + + @property + def passed(self) -> bool: + """Whether the scan passed (no CRITICAL findings).""" + return self.critical_count == 0 + + +class ContainerScanner: + """Container image security scanner. + + Attempts to use ``trivy`` (if available) for real scanning; otherwise + returns an abstract stub result indicating the scan was not performed. + + Attributes: + scan_history: All completed scan results. + _trivy_available: Whether trivy binary is accessible. + """ + + def __init__(self) -> None: + """Initialise the container scanner and probe for trivy.""" + self.scan_history: list[ContainerScanResult] = [] + self._trivy_available = self._check_trivy() + if self._trivy_available: + logger.info("ContainerScanner initialised (trivy available)") + else: + logger.warning( + "ContainerScanner initialised — trivy not found. " + "Install from: https://github.com/aquasecurity/trivy" + ) + + def scan(self, image: str, severity: str = "CRITICAL,HIGH,MEDIUM,LOW") -> ContainerScanResult: + """Scan a container image for vulnerabilities. + + Args: + image: Docker image reference (e.g. ``"nginx:1.25"``). + severity: Comma-separated severity levels to include. + + Returns: + :class:`ContainerScanResult` with findings. 
+ """ + import time + scan_id = f"con_scan_{int(time.time()*1000)}" + + if self._trivy_available: + result = self._run_trivy(image, severity, scan_id) + else: + result = self._abstract_result(image, scan_id) + + self.scan_history.append(result) + logger.info( + "Container scan '{}': C:{}, H:{}, M:{}, L:{}", + image, + result.critical_count, + result.high_count, + result.medium_count, + result.low_count, + ) + return result + + def _run_trivy(self, image: str, severity: str, scan_id: str) -> ContainerScanResult: + """Run trivy and parse its JSON output. + + Args: + image: Container image reference. + severity: Severity filter string. + scan_id: Scan identifier. + + Returns: + Parsed :class:`ContainerScanResult`. + """ + import json + try: + proc = subprocess.run( + [ + "trivy", + "image", + "--format", + "json", + "--severity", + severity, + "--quiet", + image, + ], + capture_output=True, + text=True, + timeout=300, + ) + data = json.loads(proc.stdout or "{}") + return self._parse_trivy_output(data, image, scan_id) + except Exception as exc: + logger.error("Trivy execution error: {}", exc) + return self._abstract_result(image, scan_id, error=str(exc)) + + def _parse_trivy_output( + self, data: dict[str, Any], image: str, scan_id: str + ) -> ContainerScanResult: + """Parse trivy JSON output. + + Args: + data: Trivy JSON response. + image: Image reference. + scan_id: Scan identifier. + + Returns: + :class:`ContainerScanResult`. 
+ """ + vulns: list[ContainerVulnerability] = [] + base_image = data.get("Metadata", {}).get("OS", {}).get("Family", "") + + for result in data.get("Results", []): + layer = result.get("Target", "") + for v in result.get("Vulnerabilities", []) or []: + vulns.append(ContainerVulnerability( + cve_id=v.get("VulnerabilityID", ""), + package=v.get("PkgName", ""), + installed_version=v.get("InstalledVersion", ""), + fixed_version=v.get("FixedVersion", ""), + severity=v.get("Severity", "UNKNOWN").upper(), + layer=layer, + description=(v.get("Description", ""))[:200], + )) + + counts = {"CRITICAL": 0, "HIGH": 0, "MEDIUM": 0, "LOW": 0} + for v in vulns: + if v.severity in counts: + counts[v.severity] += 1 + + return ContainerScanResult( + scan_id=scan_id, + image=image, + vulnerabilities=vulns, + critical_count=counts["CRITICAL"], + high_count=counts["HIGH"], + medium_count=counts["MEDIUM"], + low_count=counts["LOW"], + base_image=base_image, + tool="trivy", + ) + + def _abstract_result( + self, image: str, scan_id: str, error: str = "" + ) -> ContainerScanResult: + """Return a stub result when trivy is unavailable. + + Args: + image: Image reference. + scan_id: Scan identifier. + error: Optional error message. + + Returns: + Stub :class:`ContainerScanResult`. + """ + return ContainerScanResult( + scan_id=scan_id, + image=image, + vulnerabilities=[], + critical_count=0, + high_count=0, + medium_count=0, + low_count=0, + tool="abstract" if not error else "error", + ) + + @staticmethod + def _check_trivy() -> bool: + """Check whether trivy is installed and accessible. + + Returns: + ``True`` if trivy is available. 
+ """ + try: + result = subprocess.run( + ["trivy", "--version"], + capture_output=True, + timeout=5, + ) + return result.returncode == 0 + except (FileNotFoundError, subprocess.TimeoutExpired): + return False diff --git a/devsecops/scanning/dependency_scanner.py b/devsecops/scanning/dependency_scanner.py new file mode 100644 index 0000000..1a78483 --- /dev/null +++ b/devsecops/scanning/dependency_scanner.py @@ -0,0 +1,261 @@ +"""Dependency vulnerability scanning against a known CVE database.""" + +from __future__ import annotations + +from dataclasses import dataclass, field +from datetime import datetime, timezone +from typing import Any + +from loguru import logger + + +@dataclass +class Vulnerability: + """A known vulnerability in a dependency. + + Attributes: + cve_id: CVE identifier (e.g. ``"CVE-2021-12345"``). + package_name: Affected package name. + affected_versions: Version range string (e.g. ``"<2.0.0"``). + severity: CVSS severity (``"CRITICAL"``, ``"HIGH"``, ``"MEDIUM"``, ``"LOW"``). + cvss_score: CVSS base score (0–10). + description: Vulnerability description. + fix_version: Version that resolves the vulnerability. + references: URLs to advisories. + """ + + cve_id: str + package_name: str + affected_versions: str + severity: str + cvss_score: float + description: str + fix_version: str = "" + references: list[str] = field(default_factory=list) + + +@dataclass +class DependencyFinding: + """A vulnerability finding for a specific installed version. + + Attributes: + package_name: Package name. + installed_version: Currently installed version string. + vulnerability: The matched vulnerability record. + is_fixed_version_available: Whether a fix is known. + """ + + package_name: str + installed_version: str + vulnerability: Vulnerability + is_fixed_version_available: bool + + +@dataclass +class DependencyScanResult: + """Result of a dependency vulnerability scan. + + Attributes: + scan_id: Unique scan identifier. 
@dataclass
class DependencyScanResult:
    """Result of a dependency vulnerability scan.

    Attributes:
        scan_id: Unique scan identifier.
        scanned_packages: Total packages evaluated.
        findings: All vulnerability findings.
        critical_count: Number of CRITICAL findings.
        high_count: Number of HIGH findings.
        medium_count: Number of MEDIUM findings.
        low_count: Number of LOW findings.
        scanned_at: UTC timestamp.
    """

    scan_id: str
    scanned_packages: int
    findings: list[DependencyFinding]
    critical_count: int
    high_count: int
    medium_count: int
    low_count: int
    scanned_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc))

    @property
    def passed(self) -> bool:
        """Whether the scan passed (no CRITICAL or HIGH findings)."""
        return self.critical_count == 0 and self.high_count == 0


def _sample_cve_db() -> list[Vulnerability]:
    """Build the minimal sample CVE database (demonstration data only).

    Constructed lazily so importing the module does not allocate the records,
    and each scanner receives its own fresh list (same copy semantics as the
    previous ``list(_SAMPLE_CVE_DB)``).

    Returns:
        New list of sample :class:`Vulnerability` records.
    """
    return [
        Vulnerability(
            cve_id="CVE-2022-42919",
            package_name="cpython",
            affected_versions="<3.11.1",
            severity="HIGH",
            cvss_score=7.8,
            description="Local privilege escalation on Linux via Python's multiprocessing",
            fix_version="3.11.1",
        ),
        Vulnerability(
            cve_id="CVE-2023-24329",
            package_name="urllib3",
            affected_versions="<1.26.15",
            severity="MEDIUM",
            cvss_score=5.3,
            description="urllib3 HTTP request smuggling via crafted scheme",
            fix_version="1.26.15",
        ),
        Vulnerability(
            cve_id="CVE-2022-23491",
            package_name="certifi",
            affected_versions="<2022.12.7",
            severity="MEDIUM",
            cvss_score=6.5,
            description="Certifi includes roots for e-Tugra CA which was revoked",
            fix_version="2022.12.7",
        ),
        Vulnerability(
            cve_id="CVE-2021-33503",
            package_name="urllib3",
            affected_versions="<1.26.5",
            severity="HIGH",
            cvss_score=7.5,
            description="urllib3 ReDoS in authority regex parsing",
            fix_version="1.26.5",
        ),
    ]


class DependencyScanner:
    """Dependency vulnerability scanner using an abstract CVE interface.

    Scans a list of package–version pairs against a known vulnerability
    database. In production this would integrate with OSV, NVD, or
    GitHub Advisory Database APIs.

    Attributes:
        _cve_db: Vulnerability database.
        scan_history: All completed scan results.
    """

    def __init__(self, cve_db: list[Vulnerability] | None = None) -> None:
        """Initialise the dependency scanner.

        Args:
            cve_db: Optional custom CVE database; uses built-in sample if None.
        """
        self._cve_db = cve_db or _sample_cve_db()
        self.scan_history: list[DependencyScanResult] = []
        logger.info("DependencyScanner initialised ({} CVEs in DB)", len(self._cve_db))

    def add_vulnerability(self, vuln: Vulnerability) -> None:
        """Add a vulnerability to the local CVE database.

        Args:
            vuln: Vulnerability record to add.
        """
        self._cve_db.append(vuln)

    def scan(
        self,
        packages: dict[str, str],
    ) -> DependencyScanResult:
        """Scan installed packages against the CVE database.

        Args:
            packages: Mapping of package name to installed version string.

        Returns:
            :class:`DependencyScanResult` with all findings.
        """
        import time
        scan_id = f"dep_scan_{int(time.time()*1000)}"
        findings: list[DependencyFinding] = []

        # Package-name match is case-insensitive; each matching CVE is then
        # checked against the installed version.
        for pkg_name, installed_version in packages.items():
            for vuln in self._cve_db:
                if vuln.package_name.lower() == pkg_name.lower():
                    if self._is_affected(installed_version, vuln.affected_versions):
                        is_fixed = bool(vuln.fix_version)
                        findings.append(DependencyFinding(
                            package_name=pkg_name,
                            installed_version=installed_version,
                            vulnerability=vuln,
                            is_fixed_version_available=is_fixed,
                        ))

        critical = sum(1 for f in findings if f.vulnerability.severity == "CRITICAL")
        high = sum(1 for f in findings if f.vulnerability.severity == "HIGH")
        medium = sum(1 for f in findings if f.vulnerability.severity == "MEDIUM")
        low = sum(1 for f in findings if f.vulnerability.severity == "LOW")

        result = DependencyScanResult(
            scan_id=scan_id,
            scanned_packages=len(packages),
            findings=findings,
            critical_count=critical,
            high_count=high,
            medium_count=medium,
            low_count=low,
        )
        self.scan_history.append(result)
        logger.info(
            "Dependency scan: {}/{} packages vulnerable (C:{}, H:{}, M:{}, L:{})",
            len(findings),
            len(packages),
            critical,
            high,
            medium,
            low,
        )
        return result

    def _is_affected(self, installed: str, version_constraint: str) -> bool:
        """Determine whether the installed version satisfies a constraint.

        Supports simple comma-joined constraints: ``<x.y.z``, ``<=x.y.z``,
        ``>x.y.z``, ``>=x.y.z``, and ``==x.y.z``.

        Args:
            installed: Installed version string.
            version_constraint: Constraint string.

        Returns:
            ``True`` if the installed version is affected.
        """
        try:
            installed_tuple = self._parse_version(installed)
            for constraint in version_constraint.split(","):
                constraint = constraint.strip()
                # Two-character operators are tested before their
                # one-character prefixes so "<=" is not consumed by "<".
                if constraint.startswith("<="):
                    target = self._parse_version(constraint[2:])
                    if installed_tuple > target:
                        return False
                elif constraint.startswith("<"):
                    target = self._parse_version(constraint[1:])
                    if installed_tuple >= target:
                        return False
                elif constraint.startswith(">="):
                    target = self._parse_version(constraint[2:])
                    if installed_tuple < target:
                        return False
                elif constraint.startswith(">"):
                    target = self._parse_version(constraint[1:])
                    if installed_tuple <= target:
                        return False
                elif constraint.startswith("=="):
                    target = self._parse_version(constraint[2:])
                    if installed_tuple != target:
                        return False
                # An unrecognised constraint contributes no restriction,
                # leaving the package flagged as affected (conservative).
            return True
        except Exception:
            return False  # Cannot determine — treat as unaffected

    @staticmethod
    def _parse_version(version_str: str) -> tuple[int, ...]:
        """Parse a semantic version string into a comparable tuple.

        Each dotted component contributes its leading digit run, so
        pre-release suffixes are tolerated (``"1.26.15rc1"`` → ``(1, 26, 15)``
        — the previous ``p.isdigit()`` filter silently dropped such
        components entirely); components with no leading digits are skipped.

        Args:
            version_str: Version string (e.g. ``"1.2.3"``).

        Returns:
            Tuple of integers (e.g. ``(1, 2, 3)``).
        """
        numbers: list[int] = []
        for part in version_str.strip().split("."):
            digits = ""
            for ch in part:
                if not ch.isdigit():
                    break
                digits += ch
            if digits:
                numbers.append(int(digits))
        return tuple(numbers)
# NOTE(review): remainder of the patch (new files devsecops/security/* and
# compliance_checker.py) is truncated at this chunk boundary; original diff
# records preserved below.
# diff --git a/devsecops/security/__init__.py b/devsecops/security/__init__.py
# new file mode 100644 index 0000000..e69de29
# diff --git a/devsecops/security/__pycache__/__init__.cpython-312.pyc b/devsecops/security/__pycache__/__init__.cpython-312.pyc
# new file mode 100644 index 0000000..069432e Binary files /dev/null and b/devsecops/security/__pycache__/__init__.cpython-312.pyc differ
# diff --git a/devsecops/security/__pycache__/compliance_checker.cpython-312.pyc b/devsecops/security/__pycache__/compliance_checker.cpython-312.pyc
# new file mode 100644 index 0000000..87eaf73 Binary files /dev/null and b/devsecops/security/__pycache__/compliance_checker.cpython-312.pyc differ
# diff --git a/devsecops/security/__pycache__/encryption.cpython-312.pyc b/devsecops/security/__pycache__/encryption.cpython-312.pyc
# new file mode 100644 index 0000000..bae8c2b Binary files /dev/null and b/devsecops/security/__pycache__/encryption.cpython-312.pyc differ
# diff --git a/devsecops/security/__pycache__/secret_manager.cpython-312.pyc b/devsecops/security/__pycache__/secret_manager.cpython-312.pyc
# new file mode 100644 index 0000000..f252a79 Binary files /dev/null and b/devsecops/security/__pycache__/secret_manager.cpython-312.pyc differ
# diff --git a/devsecops/security/__pycache__/threat_detection.cpython-312.pyc b/devsecops/security/__pycache__/threat_detection.cpython-312.pyc
# new file mode 100644 index 0000000..d54697f Binary files /dev/null and b/devsecops/security/__pycache__/threat_detection.cpython-312.pyc differ
# diff --git a/devsecops/security/compliance_checker.py b/devsecops/security/compliance_checker.py
# new file mode 100644 index 0000000..cd4b10c --- /dev/null +++ b/devsecops/security/compliance_checker.py
# @@ -0,0 +1,309 @@ +"""Regulatory compliance checks for GDPR, SOX, and FINRA."""
# +from __future__ import annotations +from abc import ABC, abstractmethod +from dataclasses import
class Regulation(Enum):
    """Supported regulatory frameworks."""

    GDPR = auto()
    SOX = auto()
    FINRA = auto()
    PCI_DSS = auto()
    MiFID2 = auto()


class ComplianceStatus(Enum):
    """Result of a compliance check."""

    PASS = auto()
    FAIL = auto()
    WARNING = auto()
    NOT_APPLICABLE = auto()


@dataclass
class ComplianceFinding:
    """A single compliance check result.

    Attributes:
        check_id: Unique check identifier.
        regulation: Regulatory framework.
        control: Specific control or requirement identifier.
        description: Human-readable check description.
        status: Pass/fail/warning result.
        evidence: Supporting evidence or details.
        remediation: Suggested remediation if failed.
        checked_at: UTC timestamp of when the check ran.
    """

    check_id: str
    regulation: Regulation
    control: str
    description: str
    status: ComplianceStatus
    evidence: dict[str, Any] = field(default_factory=dict)
    remediation: str = ""
    checked_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc))


class BaseComplianceCheck(ABC):
    """Abstract base for a compliance check.

    Subclasses implement the actual check logic for a specific
    regulatory control.
    """

    @abstractmethod
    def run(self, context: dict[str, Any]) -> ComplianceFinding:
        """Execute the compliance check.

        Args:
            context: System context data required for the check.

        Returns:
            :class:`ComplianceFinding` with the result.
        """


class GDPRDataRetentionCheck(BaseComplianceCheck):
    """GDPR Art. 5(1)(e): Data minimisation and storage limitation."""

    def run(self, context: dict[str, Any]) -> ComplianceFinding:
        """Check that PII is not retained beyond policy limits.

        Args:
            context: Should contain ``"max_retention_days"`` (defaults to
                365) and ``"actual_retention_days"`` (defaults to 0, which
                passes trivially).

        Returns:
            :class:`ComplianceFinding`.
        """
        max_days = context.get("max_retention_days", 365)
        actual_days = context.get("actual_retention_days", 0)
        status = ComplianceStatus.PASS if actual_days <= max_days else ComplianceStatus.FAIL
        return ComplianceFinding(
            check_id="GDPR-5-1-E",
            regulation=Regulation.GDPR,
            control="Art. 5(1)(e) Storage Limitation",
            description="PII retained within policy limits",
            status=status,
            evidence={"max_days": max_days, "actual_days": actual_days},
            remediation="Purge data older than retention policy" if status == ComplianceStatus.FAIL else "",
        )


class GDPREncryptionCheck(BaseComplianceCheck):
    """GDPR Art. 32: Encryption of personal data at rest and in transit."""

    def run(self, context: dict[str, Any]) -> ComplianceFinding:
        """Check that PII is encrypted at rest and in transit.

        Args:
            context: Should contain ``"encryption_at_rest"`` and
                ``"encryption_in_transit"`` booleans (missing keys are
                treated as ``False``, i.e. failing).

        Returns:
            :class:`ComplianceFinding`.
        """
        at_rest = context.get("encryption_at_rest", False)
        in_transit = context.get("encryption_in_transit", False)
        passed = at_rest and in_transit
        status = ComplianceStatus.PASS if passed else ComplianceStatus.FAIL
        return ComplianceFinding(
            check_id="GDPR-32",
            regulation=Regulation.GDPR,
            control="Art. 32 Security of Processing",
            description="Personal data encrypted at rest and in transit",
            status=status,
            evidence={"encryption_at_rest": at_rest, "encryption_in_transit": in_transit},
            remediation="Enable encryption for PII at rest and in transit" if not passed else "",
        )


class SOXAuditTrailCheck(BaseComplianceCheck):
    """SOX Section 404: Audit trail completeness for financial data."""

    def run(self, context: dict[str, Any]) -> ComplianceFinding:
        """Check that financial transactions have an immutable audit trail.

        Args:
            context: Should contain ``"audit_trail_enabled"`` and
                ``"audit_trail_immutable"`` booleans (missing keys fail).

        Returns:
            :class:`ComplianceFinding`.
        """
        enabled = context.get("audit_trail_enabled", False)
        immutable = context.get("audit_trail_immutable", False)
        passed = enabled and immutable
        status = ComplianceStatus.PASS if passed else ComplianceStatus.FAIL
        return ComplianceFinding(
            check_id="SOX-404",
            regulation=Regulation.SOX,
            control="Section 404 Internal Controls",
            description="Financial transaction audit trail is complete and immutable",
            status=status,
            evidence={"enabled": enabled, "immutable": immutable},
            remediation="Enable HMAC-signed immutable audit logging" if not passed else "",
        )


class FINRARecordKeepingCheck(BaseComplianceCheck):
    """FINRA Rule 4511: Books and records retention for 6 years."""

    def run(self, context: dict[str, Any]) -> ComplianceFinding:
        """Check that trading records are retained for the required period.

        Args:
            context: Should contain ``"record_retention_years"``
                (missing key is treated as 0 years, i.e. failing).

        Returns:
            :class:`ComplianceFinding`.
        """
        required_years = 6
        actual_years = context.get("record_retention_years", 0)
        passed = actual_years >= required_years
        status = ComplianceStatus.PASS if passed else ComplianceStatus.FAIL
        return ComplianceFinding(
            check_id="FINRA-4511",
            regulation=Regulation.FINRA,
            control="Rule 4511 Books and Records",
            description=f"Trading records retained for ≥{required_years} years",
            status=status,
            evidence={"required_years": required_years, "actual_years": actual_years},
            remediation=f"Extend record retention to {required_years} years" if not passed else "",
        )


class FINRABestExecutionCheck(BaseComplianceCheck):
    """FINRA Rule 5310: Best execution obligation for client orders."""

    def run(self, context: dict[str, Any]) -> ComplianceFinding:
        """Check that best execution policies are in place and monitored.

        Args:
            context: Should contain ``"best_execution_policy_enabled"``
                boolean (missing key fails).

        Returns:
            :class:`ComplianceFinding`.
        """
        enabled = context.get("best_execution_policy_enabled", False)
        status = ComplianceStatus.PASS if enabled else ComplianceStatus.FAIL
        return ComplianceFinding(
            check_id="FINRA-5310",
            regulation=Regulation.FINRA,
            control="Rule 5310 Best Execution",
            description="Best execution policy active and monitored",
            status=status,
            evidence={"policy_enabled": enabled},
            remediation="Implement and activate best execution monitoring" if not enabled else "",
        )


class ComplianceChecker:
    """Regulatory compliance checks for GDPR, SOX, and FINRA.

    Runs a suite of abstract compliance checks against provided system
    context and generates a findings report.

    Attributes:
        _checks: Registered compliance checks.
        findings_history: All historical findings.
    """

    def __init__(self) -> None:
        """Initialise with the built-in check suite."""
        self._checks: list[BaseComplianceCheck] = [
            GDPRDataRetentionCheck(),
            GDPREncryptionCheck(),
            SOXAuditTrailCheck(),
            FINRARecordKeepingCheck(),
            FINRABestExecutionCheck(),
        ]
        self.findings_history: list[ComplianceFinding] = []
        logger.info("ComplianceChecker initialised with {} checks", len(self._checks))

    def register_check(self, check: BaseComplianceCheck) -> None:
        """Register a custom compliance check.

        Args:
            check: Check implementation to add.
        """
        self._checks.append(check)
        logger.info("Custom compliance check registered: {}", type(check).__name__)

    def run_all(self, context: dict[str, Any]) -> list[ComplianceFinding]:
        """Execute all registered compliance checks.

        A check that raises is logged and skipped (best-effort); the
        remaining checks still run.

        Args:
            context: System context data passed to each check.

        Returns:
            List of :class:`ComplianceFinding` results.
        """
        findings: list[ComplianceFinding] = []
        for check in self._checks:
            try:
                finding = check.run(context)
                findings.append(finding)
                # Failures are surfaced at WARNING; everything else at DEBUG.
                log = logger.warning if finding.status == ComplianceStatus.FAIL else logger.debug
                log("Check {}: {}", finding.check_id, finding.status.name)
            except Exception as exc:
                logger.error("Check {} raised: {}", type(check).__name__, exc)

        self.findings_history.extend(findings)
        passed = sum(1 for f in findings if f.status == ComplianceStatus.PASS)
        failed = sum(1 for f in findings if f.status == ComplianceStatus.FAIL)
        logger.info("Compliance run: {}/{} passed, {} failed", passed, len(findings), failed)
        return findings

    def run_for_regulation(
        self,
        regulation: Regulation,
        context: dict[str, Any],
    ) -> list[ComplianceFinding]:
        """Run the full check suite and return findings for one regulation.

        NOTE: every registered check is executed (and all findings are
        recorded in ``findings_history``); only the *returned* list is
        filtered to ``regulation``. Checks cannot be skipped up front
        because a check's regulation is only known from the finding it
        produces.

        Args:
            regulation: Target regulatory framework.
            context: System context data.

        Returns:
            Findings whose ``regulation`` matches the requested one.
        """
        findings = self.run_all(context)
        return [f for f in findings if f.regulation == regulation]

    def summary(self, findings: list[ComplianceFinding]) -> dict[str, Any]:
        """Generate a compliance summary.

        Args:
            findings: List of findings to summarise.

        Returns:
            Summary dictionary with counts by status, failing check IDs,
            and an overall pass rate in [0, 1].
        """
        by_status: dict[str, int] = {}
        for f in findings:
            key = f.status.name
            by_status[key] = by_status.get(key, 0) + 1

        return {
            "total": len(findings),
            "by_status": by_status,
            "failed_checks": [
                f.check_id for f in findings if f.status == ComplianceStatus.FAIL
            ],
            # max() guards the empty-findings case against ZeroDivisionError.
            "pass_rate": round(
                by_status.get("PASS", 0) / max(len(findings), 1), 4
            ),
        }
+ + Args: + key: Optional Fernet-compatible 32-byte base64url key. + Generate with :meth:`generate_key`. + + Raises: + EncryptionError: If ``cryptography`` is unavailable and + any encryption/decryption operation is attempted. + """ + self._fernet: Any = None + + if not _CRYPTOGRAPHY_AVAILABLE: + logger.warning( + "cryptography package not installed. " + "Encryption operations will raise EncryptionError. " + "Install with: pip install cryptography" + ) + return + + if key is None: + key = Fernet.generate_key() + + try: + self._fernet = Fernet(key) + except Exception as exc: + raise EncryptionError(f"Invalid Fernet key: {exc}") from exc + + logger.info("Encryption engine initialised (cryptography library available)") + + @staticmethod + def generate_key() -> bytes: + """Generate a new random Fernet encryption key. + + Returns: + URL-safe base64-encoded 32-byte key. + + Raises: + EncryptionError: If ``cryptography`` is unavailable. + """ + if not _CRYPTOGRAPHY_AVAILABLE: + raise EncryptionError( + "cryptography package required. Install with: pip install cryptography" + ) + return Fernet.generate_key() + + @staticmethod + def derive_key(passphrase: str, salt: bytes | None = None) -> tuple[bytes, bytes]: + """Derive a Fernet key from a passphrase using PBKDF2-HMAC-SHA256. + + Args: + passphrase: Human-memorable passphrase. + salt: Optional 16-byte salt; generated randomly if ``None``. + + Returns: + Tuple of ``(key, salt)`` where key is Fernet-compatible. + + Raises: + EncryptionError: If ``cryptography`` is unavailable. + """ + if not _CRYPTOGRAPHY_AVAILABLE: + raise EncryptionError( + "cryptography package required. Install with: pip install cryptography" + ) + + if salt is None: + salt = os.urandom(16) + + kdf = PBKDF2HMAC( + algorithm=hashes.SHA256(), + length=32, + salt=salt, + iterations=480_000, + ) + key = base64.urlsafe_b64encode(kdf.derive(passphrase.encode())) + return key, salt + + def encrypt(self, plaintext: bytes) -> bytes: + """Encrypt plaintext bytes. 
+ + Args: + plaintext: Data to encrypt. + + Returns: + Fernet token (encrypted ciphertext). + + Raises: + EncryptionError: If ``cryptography`` is unavailable or + encryption fails. + """ + self._assert_available() + try: + return self._fernet.encrypt(plaintext) + except Exception as exc: + raise EncryptionError(f"Encryption failed: {exc}") from exc + + def encrypt_text(self, text: str, encoding: str = "utf-8") -> bytes: + """Encrypt a unicode string. + + Args: + text: String to encrypt. + encoding: Character encoding. + + Returns: + Fernet token bytes. + + Raises: + EncryptionError: If encryption fails. + """ + return self.encrypt(text.encode(encoding)) + + def decrypt(self, token: bytes) -> bytes: + """Decrypt a Fernet token. + + Args: + token: Encrypted Fernet token. + + Returns: + Decrypted plaintext bytes. + + Raises: + EncryptionError: If decryption fails (bad key or tampered data). + """ + self._assert_available() + try: + return self._fernet.decrypt(token) + except InvalidToken as exc: + raise EncryptionError("Decryption failed: invalid token or wrong key") from exc + except Exception as exc: + raise EncryptionError(f"Decryption failed: {exc}") from exc + + def decrypt_text(self, token: bytes, encoding: str = "utf-8") -> str: + """Decrypt a Fernet token to a unicode string. + + Args: + token: Encrypted Fernet token. + encoding: Character encoding. + + Returns: + Decrypted string. + + Raises: + EncryptionError: If decryption fails. + """ + return self.decrypt(token).decode(encoding) + + def rotate_key(self, new_key: bytes) -> None: + """Replace the current encryption key. + + Existing tokens encrypted with the old key will no longer be + decryptable after rotation unless you re-encrypt them first. + + Args: + new_key: New Fernet-compatible key. + + Raises: + EncryptionError: If the new key is invalid. 
+ """ + self._assert_available() + try: + self._fernet = Fernet(new_key) + logger.info("Encryption key rotated") + except Exception as exc: + raise EncryptionError(f"Key rotation failed: {exc}") from exc + + def _assert_available(self) -> None: + """Raise EncryptionError if the cryptography library is unavailable. + + Raises: + EncryptionError: If ``cryptography`` is not installed. + """ + if not _CRYPTOGRAPHY_AVAILABLE: + raise EncryptionError( + "cryptography package required. Install with: pip install cryptography" + ) + if self._fernet is None: + raise EncryptionError("Encryption engine not initialised") + + @property + def is_available(self) -> bool: + """Whether the cryptography library is available and engine is ready.""" + return _CRYPTOGRAPHY_AVAILABLE and self._fernet is not None diff --git a/devsecops/security/secret_manager.py b/devsecops/security/secret_manager.py new file mode 100644 index 0000000..e5dd8bd --- /dev/null +++ b/devsecops/security/secret_manager.py @@ -0,0 +1,139 @@ +"""API key and secret management using environment variables only.""" + +from __future__ import annotations + +import os +from typing import Any + +from loguru import logger + + +class SecretNotFoundError(KeyError): + """Raised when a requested secret is not available.""" + + +class SecretManager: + """API key and secret management via environment variables. + + Reads secrets exclusively from environment variables — never from + code, configuration files, or hard-coded values. Provides a + consistent interface for retrieving and validating secrets. + + Attributes: + _secret_registry: Mapping of logical name to environment variable name. + _required_secrets: Set of secrets that must be present at startup. 
+ """ + + def __init__(self) -> None: + """Initialise the secret manager with an empty registry.""" + self._secret_registry: dict[str, str] = {} + self._required_secrets: set[str] = set() + logger.info("SecretManager initialised") + + def register( + self, + name: str, + env_var: str, + required: bool = False, + ) -> None: + """Register a secret by mapping a logical name to an env variable. + + Args: + name: Logical name used to retrieve the secret. + env_var: Environment variable name where the secret is stored. + required: If ``True``, the secret is validated at startup. + """ + self._secret_registry[name] = env_var + if required: + self._required_secrets.add(name) + logger.debug("Secret '{}' registered → env var '{}'", name, env_var) + + def get(self, name: str, default: str | None = None) -> str | None: + """Retrieve a secret value from the environment. + + Args: + name: Logical secret name (must be registered first). + default: Fallback value if the env variable is not set. + + Returns: + Secret value string, or ``default`` if not found. + + Raises: + SecretNotFoundError: If ``name`` is not registered. + """ + if name not in self._secret_registry: + raise SecretNotFoundError( + f"Secret '{name}' is not registered. Call register() first." + ) + env_var = self._secret_registry[name] + value = os.environ.get(env_var, default) + if value is None: + logger.debug("Secret '{}' not set (env var: {})", name, env_var) + return value + + def require(self, name: str) -> str: + """Retrieve a required secret; raises if not set. + + Args: + name: Logical secret name. + + Returns: + Secret value string. + + Raises: + SecretNotFoundError: If not registered or env variable not set. + """ + value = self.get(name) + if value is None: + env_var = self._secret_registry.get(name, "?") + raise SecretNotFoundError( + f"Required secret '{name}' is not set. " + f"Set environment variable '{env_var}'." 
+ ) + return value + + def validate_required(self) -> list[str]: + """Check that all required secrets are present. + + Returns: + List of missing required secret names (empty if all present). + """ + missing: list[str] = [] + for name in self._required_secrets: + if self.get(name) is None: + missing.append(name) + if missing: + logger.error("Missing required secrets: {}", missing) + else: + logger.info("All {} required secrets validated", len(self._required_secrets)) + return missing + + def is_set(self, name: str) -> bool: + """Check whether a registered secret is currently available. + + Args: + name: Logical secret name. + + Returns: + ``True`` if the secret is registered and the env variable is set. + """ + try: + return self.get(name) is not None + except SecretNotFoundError: + return False + + def list_registered(self) -> dict[str, dict[str, Any]]: + """List all registered secrets with their status. + + Returns: + Mapping of secret name to metadata dict with ``"env_var"``, + ``"required"``, and ``"is_set"`` keys. + """ + return { + name: { + "env_var": env_var, + "required": name in self._required_secrets, + "is_set": self.is_set(name), + } + for name, env_var in self._secret_registry.items() + } diff --git a/devsecops/security/threat_detection.py b/devsecops/security/threat_detection.py new file mode 100644 index 0000000..f93776a --- /dev/null +++ b/devsecops/security/threat_detection.py @@ -0,0 +1,238 @@ +"""Security monitoring with rate limiting, IP blocking, and anomaly detection.""" + +from __future__ import annotations + +import time +from collections import defaultdict +from dataclasses import dataclass, field +from datetime import datetime, timezone +from typing import Any + +import numpy as np +from loguru import logger + + +@dataclass +class RateLimitConfig: + """Configuration for rate limiting a resource. + + Attributes: + resource: Resource or endpoint identifier. + max_requests: Maximum allowed requests per window. 
+ window_seconds: Rolling window duration in seconds. + """ + + resource: str + max_requests: int + window_seconds: float = 60.0 + + +@dataclass +class ThreatEvent: + """A detected security threat event. + + Attributes: + event_id: Unique identifier. + event_type: Category (``"rate_limit"``, ``"ip_blocked"``, ``"anomaly"``). + source_ip: Originating IP address. + resource: Affected resource. + details: Supplementary event data. + severity: ``"low"``, ``"medium"``, or ``"high"``. + detected_at: UTC timestamp. + """ + + event_id: str + event_type: str + source_ip: str + resource: str + details: dict[str, Any] = field(default_factory=dict) + severity: str = "medium" + detected_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + + +class ThreatDetection: + """Security monitoring with rate limiting, IP blocking, and anomaly detection. + + Tracks per-IP request rates and flags anomalous usage patterns. + + Attributes: + blocked_ips: Set of currently blocked IP addresses. + rate_limits: Per-resource rate limit configurations. + threat_log: All detected threat events. + _request_log: Per-(ip, resource) request timestamps. + _baseline_rates: Per-resource baseline request rate (requests/s). + """ + + def __init__(self) -> None: + """Initialise the threat detection engine.""" + self.blocked_ips: set[str] = set() + self.rate_limits: dict[str, RateLimitConfig] = {} + self.threat_log: list[ThreatEvent] = [] + self._request_log: dict[str, list[float]] = defaultdict(list) + self._baseline_rates: dict[str, float] = {} + self._event_counter = 0 + logger.info("ThreatDetection initialised") + + def configure_rate_limit(self, config: RateLimitConfig) -> None: + """Set or update a rate limit for a resource. + + Args: + config: Rate limit configuration. 
+ """ + self.rate_limits[config.resource] = config + logger.debug( + "Rate limit configured: {} → {}/{:.0f}s", + config.resource, + config.max_requests, + config.window_seconds, + ) + + def check_rate_limit(self, source_ip: str, resource: str) -> bool: + """Check if a request from a given IP is within the rate limit. + + Also blocks IPs that repeatedly exceed the limit. + + Args: + source_ip: Client IP address. + resource: Resource or endpoint being accessed. + + Returns: + ``True`` if the request is allowed, ``False`` if rate-limited + or blocked. + """ + if source_ip in self.blocked_ips: + self._fire_event("ip_blocked", source_ip, resource, severity="high") + return False + + config = self.rate_limits.get(resource) + if config is None: + return True # No limit configured + + key = f"{source_ip}:{resource}" + now = time.monotonic() + window_start = now - config.window_seconds + + # Prune old timestamps + self._request_log[key] = [ + ts for ts in self._request_log[key] if ts >= window_start + ] + self._request_log[key].append(now) + + count = len(self._request_log[key]) + if count > config.max_requests: + self._fire_event( + "rate_limit", + source_ip, + resource, + details={"count": count, "limit": config.max_requests}, + severity="medium", + ) + # Block after 3× the limit + if count > config.max_requests * 3: + self.blocked_ips.add(source_ip) + logger.warning("IP {} auto-blocked after {}× rate limit", source_ip, count) + return False + + return True + + def block_ip(self, ip: str, reason: str = "manual") -> None: + """Manually block an IP address. + + Args: + ip: IP address to block. + reason: Human-readable reason for audit trail. + """ + self.blocked_ips.add(ip) + self._fire_event("ip_blocked", ip, "manual", details={"reason": reason}, severity="high") + logger.warning("IP {} blocked: {}", ip, reason) + + def unblock_ip(self, ip: str) -> bool: + """Remove an IP from the block list. + + Args: + ip: IP address to unblock. 
+ + Returns: + ``True`` if the IP was blocked and is now unblocked. + """ + if ip in self.blocked_ips: + self.blocked_ips.discard(ip) + logger.info("IP {} unblocked", ip) + return True + return False + + def set_baseline(self, resource: str, baseline_rps: float) -> None: + """Set the expected baseline request rate for anomaly detection. + + Args: + resource: Resource identifier. + baseline_rps: Expected requests per second. + """ + self._baseline_rates[resource] = baseline_rps + + def detect_anomaly( + self, + source_ip: str, + resource: str, + observed_rps: float, + ) -> ThreatEvent | None: + """Detect anomalous request rates using Z-score comparison. + + Args: + source_ip: Client IP. + resource: Resource being accessed. + observed_rps: Current observed request rate. + + Returns: + :class:`ThreatEvent` if anomalous, ``None`` if normal. + """ + baseline = self._baseline_rates.get(resource) + if baseline is None: + return None + + # Simple ratio-based anomaly detection + ratio = observed_rps / (baseline + 1e-6) + if ratio > 5.0: + event = self._fire_event( + "anomaly", + source_ip, + resource, + details={"observed_rps": observed_rps, "baseline_rps": baseline, "ratio": ratio}, + severity="high" if ratio > 10.0 else "medium", + ) + return event + return None + + def _fire_event( + self, + event_type: str, + source_ip: str, + resource: str, + details: dict[str, Any] | None = None, + severity: str = "medium", + ) -> ThreatEvent: + """Create and record a threat event. + + Args: + event_type: Event category. + source_ip: Originating IP. + resource: Affected resource. + details: Supplementary data. + severity: Severity label. + + Returns: + The recorded :class:`ThreatEvent`. 
+ """ + self._event_counter += 1 + event = ThreatEvent( + event_id=f"threat_{self._event_counter:06d}", + event_type=event_type, + source_ip=source_ip, + resource=resource, + details=details or {}, + severity=severity, + ) + self.threat_log.append(event) + log = logger.warning if severity == "high" else logger.debug + log("ThreatEvent [{}] {}: {} → {}", severity, event_type, source_ip, resource) + return event diff --git a/edgeops/__init__.py b/edgeops/__init__.py new file mode 100644 index 0000000..7e0836f --- /dev/null +++ b/edgeops/__init__.py @@ -0,0 +1,59 @@ +"""EdgeOps: Operations framework for edge computing nodes in the trading platform.""" + +from __future__ import annotations + +from loguru import logger + +from edgeops.edge_nodes.model_compression import ModelCompression +from edgeops.edge_nodes.edge_deployment import EdgeDeployment +from edgeops.edge_nodes.federated_learning import FederatedLearning +from edgeops.streaming.real_time_inference import RealTimeInference +from edgeops.streaming.stream_processor import StreamProcessor +from edgeops.streaming.edge_cache import EdgeCache +from edgeops.orchestration.edge_coordinator import EdgeCoordinator +from edgeops.orchestration.data_sync import DataSync + + +class EdgeOps: + """Unified EdgeOps orchestrator for trading platform edge infrastructure. + + Aggregates model compression, edge deployment, federated learning, + real-time inference, stream processing, caching, and coordination. + + Attributes: + model_compression: Model quantisation and pruning component. + edge_deployment: Edge device deployment manager. + federated_learning: Distributed federated learning coordinator. + real_time_inference: Ultra-low latency inference engine. + stream_processor: Event stream processing component. + edge_cache: Local data cache with TTL and LRU eviction. + edge_coordinator: Multi-edge topology coordinator. + data_sync: Edge-to-cloud sync manager. 
+ """ + + def __init__(self) -> None: + """Initialise all EdgeOps sub-components.""" + self.model_compression = ModelCompression() + self.edge_deployment = EdgeDeployment() + self.federated_learning = FederatedLearning() + self.real_time_inference = RealTimeInference() + self.stream_processor = StreamProcessor() + self.edge_cache = EdgeCache() + self.edge_coordinator = EdgeCoordinator() + self.data_sync = DataSync() + logger.info("EdgeOps initialised") + + def status(self) -> dict[str, str]: + """Return a health summary for all sub-components. + + Returns: + Mapping of component name to status string. + """ + return {name: "ready" for name in [ + "model_compression", "edge_deployment", "federated_learning", + "real_time_inference", "stream_processor", "edge_cache", + "edge_coordinator", "data_sync", + ]} + + +__all__ = ["EdgeOps"] diff --git a/edgeops/__pycache__/__init__.cpython-312.pyc b/edgeops/__pycache__/__init__.cpython-312.pyc new file mode 100644 index 0000000..66c4eb9 Binary files /dev/null and b/edgeops/__pycache__/__init__.cpython-312.pyc differ diff --git a/edgeops/edge_nodes/__init__.py b/edgeops/edge_nodes/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/edgeops/edge_nodes/__pycache__/__init__.cpython-312.pyc b/edgeops/edge_nodes/__pycache__/__init__.cpython-312.pyc new file mode 100644 index 0000000..3f0f334 Binary files /dev/null and b/edgeops/edge_nodes/__pycache__/__init__.cpython-312.pyc differ diff --git a/edgeops/edge_nodes/__pycache__/edge_deployment.cpython-312.pyc b/edgeops/edge_nodes/__pycache__/edge_deployment.cpython-312.pyc new file mode 100644 index 0000000..fe3e679 Binary files /dev/null and b/edgeops/edge_nodes/__pycache__/edge_deployment.cpython-312.pyc differ diff --git a/edgeops/edge_nodes/__pycache__/federated_learning.cpython-312.pyc b/edgeops/edge_nodes/__pycache__/federated_learning.cpython-312.pyc new file mode 100644 index 0000000..6395c64 Binary files /dev/null and 
b/edgeops/edge_nodes/__pycache__/federated_learning.cpython-312.pyc differ diff --git a/edgeops/edge_nodes/__pycache__/model_compression.cpython-312.pyc b/edgeops/edge_nodes/__pycache__/model_compression.cpython-312.pyc new file mode 100644 index 0000000..eda8d15 Binary files /dev/null and b/edgeops/edge_nodes/__pycache__/model_compression.cpython-312.pyc differ diff --git a/edgeops/edge_nodes/edge_deployment.py b/edgeops/edge_nodes/edge_deployment.py new file mode 100644 index 0000000..e73e99b --- /dev/null +++ b/edgeops/edge_nodes/edge_deployment.py @@ -0,0 +1,252 @@ +"""Edge device deployment management.""" + +from __future__ import annotations + +import asyncio +import uuid +from dataclasses import dataclass, field +from datetime import datetime, timezone +from enum import Enum, auto +from typing import Any + +import numpy as np +from loguru import logger + + +class DeviceStatus(Enum): + """Edge device lifecycle status.""" + + REGISTERED = auto() + ONLINE = auto() + OFFLINE = auto() + DEPLOYING = auto() + DEGRADED = auto() + DECOMMISSIONED = auto() + + +@dataclass +class EdgeDevice: + """Registered edge device metadata. + + Attributes: + device_id: Unique identifier. + name: Human-readable device name. + location: Physical or logical location tag. + hardware_spec: CPU/memory/disk specification dictionary. + status: Current lifecycle status. + registered_at: UTC registration timestamp. + last_seen_at: UTC timestamp of last heartbeat. + deployed_models: Mapping of model_id to deployment version. + tags: Arbitrary classification tags. 
+ """ + + device_id: str + name: str + location: str + hardware_spec: dict[str, Any] + status: DeviceStatus = DeviceStatus.REGISTERED + registered_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + last_seen_at: datetime | None = None + deployed_models: dict[str, str] = field(default_factory=dict) + tags: list[str] = field(default_factory=list) + + +@dataclass +class Deployment: + """A model deployment to an edge device. + + Attributes: + deployment_id: Unique identifier. + device_id: Target device. + model_id: Model being deployed. + model_version: Semantic version string. + status: Current deployment status (``"pending"``, ``"deployed"``, ``"failed"``). + deployed_at: UTC deployment timestamp. + artefact_uri: Location of the model artefact. + """ + + deployment_id: str + device_id: str + model_id: str + model_version: str + status: str = "pending" + deployed_at: datetime | None = None + artefact_uri: str = "" + + +class EdgeDeployment: + """Edge device deployment management. + + Manages the lifecycle of edge devices and model deployments, + including registration, deployment, synchronisation, and health tracking. + + Attributes: + devices: Registered edge devices keyed by device_id. + deployments: All deployments keyed by deployment_id. + """ + + def __init__(self) -> None: + """Initialise the edge deployment manager.""" + self.devices: dict[str, EdgeDevice] = {} + self.deployments: dict[str, Deployment] = {} + logger.info("EdgeDeployment manager initialised") + + def register_device( + self, + name: str, + location: str, + hardware_spec: dict[str, Any], + tags: list[str] | None = None, + ) -> EdgeDevice: + """Register a new edge device. + + Args: + name: Human-readable device name. + location: Physical or logical location identifier. + hardware_spec: Device capability specification dict. + tags: Optional classification tags. + + Returns: + The registered :class:`EdgeDevice`. + + Raises: + ValueError: If ``hardware_spec`` is empty. 
+ """ + if not hardware_spec: + raise ValueError("hardware_spec must not be empty") + + device_id = f"edge_{uuid.uuid4().hex[:8]}" + device = EdgeDevice( + device_id=device_id, + name=name, + location=location, + hardware_spec=hardware_spec, + tags=tags or [], + ) + self.devices[device_id] = device + logger.info( + "Edge device registered: name='{}', id={}, location='{}'", + name, + device_id, + location, + ) + return device + + async def deploy( + self, + device_id: str, + model_id: str, + model_version: str, + artefact_uri: str = "", + ) -> Deployment: + """Deploy a model to an edge device. + + Args: + device_id: Target device identifier. + model_id: Model identifier to deploy. + model_version: Version string. + artefact_uri: URI to the model artefact. + + Returns: + The completed :class:`Deployment`. + + Raises: + KeyError: If ``device_id`` is not found. + RuntimeError: If the device is not in a deployable state. + """ + device = self._get_device(device_id) + if device.status not in (DeviceStatus.REGISTERED, DeviceStatus.ONLINE): + raise RuntimeError( + f"Device '{device_id}' is in state {device.status.name}, cannot deploy" + ) + + deployment_id = f"dep_{uuid.uuid4().hex[:8]}" + deployment = Deployment( + deployment_id=deployment_id, + device_id=device_id, + model_id=model_id, + model_version=model_version, + artefact_uri=artefact_uri, + ) + device.status = DeviceStatus.DEPLOYING + self.deployments[deployment_id] = deployment + + logger.info( + "Deploying '{}' v{} to device '{}'", + model_id, + model_version, + device_id, + ) + await asyncio.sleep(0) # Simulate transfer + + deployment.status = "deployed" + deployment.deployed_at = datetime.now(timezone.utc) + device.deployed_models[model_id] = model_version + device.status = DeviceStatus.ONLINE + device.last_seen_at = deployment.deployed_at + + logger.info( + "Deployment {} complete: '{}' v{} on '{}'", + deployment_id, + model_id, + model_version, + device_id, + ) + return deployment + + async def sync( + self, 
+ device_id: str, + config_updates: dict[str, Any] | None = None, + ) -> dict[str, Any]: + """Synchronise device configuration and state. + + Args: + device_id: Device to sync. + config_updates: Optional configuration values to push. + + Returns: + Sync result dictionary with status and applied changes. + + Raises: + KeyError: If ``device_id`` is not found. + """ + device = self._get_device(device_id) + await asyncio.sleep(0) + + device.last_seen_at = datetime.now(timezone.utc) + if device.status == DeviceStatus.OFFLINE: + device.status = DeviceStatus.ONLINE + + result: dict[str, Any] = { + "device_id": device_id, + "synced_at": device.last_seen_at.isoformat(), + "config_applied": bool(config_updates), + "deployed_models": dict(device.deployed_models), + } + logger.debug("Synced device '{}'", device_id) + return result + + def get_online_devices(self) -> list[EdgeDevice]: + """Return all currently online devices. + + Returns: + List of online :class:`EdgeDevice` objects. + """ + return [d for d in self.devices.values() if d.status == DeviceStatus.ONLINE] + + def _get_device(self, device_id: str) -> EdgeDevice: + """Retrieve a device by ID. + + Args: + device_id: Device identifier. + + Returns: + The :class:`EdgeDevice`. + + Raises: + KeyError: If not found. 
+ """ + if device_id not in self.devices: + raise KeyError(f"Device '{device_id}' not found") + return self.devices[device_id] diff --git a/edgeops/edge_nodes/federated_learning.py b/edgeops/edge_nodes/federated_learning.py new file mode 100644 index 0000000..0ea5ff2 --- /dev/null +++ b/edgeops/edge_nodes/federated_learning.py @@ -0,0 +1,300 @@ +"""Federated learning coordination for distributed edge model training.""" + +from __future__ import annotations + +import asyncio +from dataclasses import dataclass, field +from datetime import datetime, timezone +from typing import Any + +import numpy as np +from loguru import logger + + +@dataclass +class ClientUpdate: + """A model update submitted by a federated learning client. + + Attributes: + client_id: Identifier of the contributing edge device. + gradients: Gradient arrays keyed by layer name. + n_samples: Number of local training samples. + local_loss: Training loss on the client's local dataset. + round_number: Federated round this update belongs to. + submitted_at: UTC submission timestamp. + """ + + client_id: str + gradients: dict[str, np.ndarray] + n_samples: int + local_loss: float + round_number: int + submitted_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + + +@dataclass +class AggregationResult: + """Result of a gradient aggregation step. + + Attributes: + round_number: Federated learning round. + aggregated_gradients: Sample-weighted averaged gradients. + participating_clients: IDs of clients included. + total_samples: Total training samples across all clients. + weighted_loss: Sample-weighted mean local loss. + aggregated_at: UTC timestamp. + """ + + round_number: int + aggregated_gradients: dict[str, np.ndarray] + participating_clients: list[str] + total_samples: int + weighted_loss: float + aggregated_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + + +@dataclass +class FederatedRoundResult: + """Summary of a completed federated learning round. 
+ + Attributes: + round_number: Completed round index. + n_clients: Number of participating clients. + global_loss: Aggregated loss after this round. + model_version: New global model version string. + duration_s: Wall-clock round duration in seconds. + """ + + round_number: int + n_clients: int + global_loss: float + model_version: str + duration_s: float + + +class FederatedLearning: + """Distributed federated learning coordinator for edge devices. + + Implements FedAvg (Federated Averaging) with optional differential + privacy noise injection. Coordinates rounds, aggregates gradients, + and distributes updated global model parameters. + + Attributes: + current_round: Current federated round number. + round_history: Completed round summaries. + _pending_updates: Collected client updates awaiting aggregation. + _global_model_version: Current global model version counter. + _min_clients: Minimum clients required per round. + """ + + def __init__(self, min_clients: int = 3) -> None: + """Initialise the federated learning coordinator. + + Args: + min_clients: Minimum number of client updates required to + proceed with aggregation. + """ + self.current_round: int = 0 + self.round_history: list[FederatedRoundResult] = [] + self._pending_updates: list[ClientUpdate] = [] + self._global_model_version: int = 0 + self._min_clients = min_clients + logger.info("FederatedLearning coordinator initialised (min_clients={})", min_clients) + + def submit_update(self, update: ClientUpdate) -> None: + """Accept a client gradient update. + + Args: + update: Client update from a federated participant. + + Raises: + ValueError: If ``update.round_number`` does not match the + current round. 
+ """ + if update.round_number != self.current_round: + raise ValueError( + f"Update is for round {update.round_number}, " + f"but current round is {self.current_round}" + ) + self._pending_updates.append(update) + logger.debug( + "Received update from client '{}' (round={}, samples={})", + update.client_id, + update.round_number, + update.n_samples, + ) + + def aggregate_gradients( + self, + updates: list[ClientUpdate] | None = None, + *, + dp_noise_scale: float = 0.0, + ) -> AggregationResult: + """Aggregate client updates using FedAvg (sample-weighted mean). + + Args: + updates: Updates to aggregate; defaults to pending buffer. + dp_noise_scale: Standard deviation of Gaussian noise added for + differential privacy (0 = no DP noise). + + Returns: + :class:`AggregationResult` with averaged gradients. + + Raises: + RuntimeError: If fewer than ``min_clients`` updates are available. + """ + updates = updates or self._pending_updates + if len(updates) < self._min_clients: + raise RuntimeError( + f"Insufficient updates: {len(updates)}, need {self._min_clients}" + ) + + total_samples = sum(u.n_samples for u in updates) + layer_names = list(updates[0].gradients.keys()) + aggregated: dict[str, np.ndarray] = {} + + for layer in layer_names: + weighted_sum = sum( + u.gradients[layer] * u.n_samples + for u in updates + if layer in u.gradients + ) + avg = weighted_sum / (total_samples + 1e-10) + + if dp_noise_scale > 0: + rng = np.random.default_rng() + avg = avg + rng.normal(0, dp_noise_scale, size=avg.shape) + + aggregated[layer] = avg + + weighted_loss = sum(u.local_loss * u.n_samples for u in updates) / (total_samples + 1e-10) + result = AggregationResult( + round_number=self.current_round, + aggregated_gradients=aggregated, + participating_clients=[u.client_id for u in updates], + total_samples=total_samples, + weighted_loss=round(float(weighted_loss), 4), + ) + logger.info( + "Aggregated {} clients, {} samples, weighted_loss={:.4f}", + len(updates), + total_samples, + 
weighted_loss, + ) + return result + + def federated_average( + self, + model_weights: list[dict[str, np.ndarray]], + sample_counts: list[int], + ) -> dict[str, np.ndarray]: + """Compute the sample-weighted average of model weight dictionaries. + + Args: + model_weights: List of model weight dicts from each client. + sample_counts: Corresponding sample counts. + + Returns: + Averaged model weight dictionary. + + Raises: + ValueError: If ``model_weights`` and ``sample_counts`` lengths differ. + """ + if len(model_weights) != len(sample_counts): + raise ValueError( + f"Lengths differ: {len(model_weights)} models, {len(sample_counts)} counts" + ) + + total = sum(sample_counts) + 1e-10 + layer_names = list(model_weights[0].keys()) + averaged: dict[str, np.ndarray] = {} + + for layer in layer_names: + averaged[layer] = sum( + w[layer] * n for w, n in zip(model_weights, sample_counts) + ) / total + + logger.debug("FedAvg computed for {} layers", len(layer_names)) + return averaged + + async def coordinate_round( + self, + client_ids: list[str], + simulate_updates: bool = True, + ) -> FederatedRoundResult: + """Coordinate a complete federated learning round. + + Collects updates from clients, runs FedAvg, and increments the round + counter. + + Args: + client_ids: List of participating client identifiers. + simulate_updates: Generate synthetic updates when ``True``. + + Returns: + :class:`FederatedRoundResult` summarising the round. + + Raises: + RuntimeError: If fewer clients than ``min_clients`` are specified. 
+ """ + if len(client_ids) < self._min_clients: + raise RuntimeError( + f"Need ≥{self._min_clients} clients, got {len(client_ids)}" + ) + + import time + start = time.monotonic() + logger.info("Starting federated round {} with {} clients", self.current_round, len(client_ids)) + + if simulate_updates: + self._pending_updates.clear() + for client_id in client_ids: + update = self._simulate_client_update(client_id) + self._pending_updates.append(update) + + await asyncio.sleep(0) + aggregation = self.aggregate_gradients() + + self._global_model_version += 1 + duration = time.monotonic() - start + + result = FederatedRoundResult( + round_number=self.current_round, + n_clients=len(client_ids), + global_loss=aggregation.weighted_loss, + model_version=f"global_v{self._global_model_version}", + duration_s=round(duration, 4), + ) + self.round_history.append(result) + self.current_round += 1 + self._pending_updates.clear() + + logger.info( + "Federated round {} complete: loss={:.4f}, version={}", + result.round_number, + result.global_loss, + result.model_version, + ) + return result + + def _simulate_client_update(self, client_id: str) -> ClientUpdate: + """Generate a synthetic client update for testing. + + Args: + client_id: Client identifier. + + Returns: + Simulated :class:`ClientUpdate`. 
+ """ + rng = np.random.default_rng(seed=hash(client_id + str(self.current_round)) % (2**32)) + return ClientUpdate( + client_id=client_id, + gradients={ + "layer_1": rng.normal(0, 0.01, size=(64, 32)), + "layer_2": rng.normal(0, 0.01, size=(32, 16)), + "output": rng.normal(0, 0.01, size=(16, 1)), + }, + n_samples=int(rng.integers(100, 1000)), + local_loss=float(rng.uniform(0.1, 1.0)), + round_number=self.current_round, + ) diff --git a/edgeops/edge_nodes/model_compression.py b/edgeops/edge_nodes/model_compression.py new file mode 100644 index 0000000..42e00be --- /dev/null +++ b/edgeops/edge_nodes/model_compression.py @@ -0,0 +1,254 @@ +"""Model quantisation and pruning simulation for edge deployment.""" + +from __future__ import annotations + +from dataclasses import dataclass, field +from datetime import datetime, timezone +from enum import Enum, auto +from typing import Any + +import numpy as np +from loguru import logger + + +class CompressionMethod(Enum): + """Available model compression techniques.""" + + INT8_QUANTIZATION = auto() + INT4_QUANTIZATION = auto() + FP16_QUANTIZATION = auto() + MAGNITUDE_PRUNING = auto() + STRUCTURED_PRUNING = auto() + KNOWLEDGE_DISTILLATION = auto() + + +@dataclass +class ModelSpec: + """Specification of a model to be compressed. + + Attributes: + model_id: Unique model identifier. + parameter_count: Total number of float32 parameters. + size_mb: Model size in megabytes. + baseline_accuracy: Accuracy before compression. + target_latency_ms: Target inference latency on edge device. + """ + + model_id: str + parameter_count: int + size_mb: float + baseline_accuracy: float + target_latency_ms: float = 10.0 + + +@dataclass +class CompressionResult: + """Result of a model compression operation. + + Attributes: + model_id: Identifier of the compressed model. + method: Compression technique applied. + original_size_mb: Size before compression. + compressed_size_mb: Size after compression. + compression_ratio: original / compressed. 
class CompressionMethod(Enum):
    """Available model compression techniques."""

    INT8_QUANTIZATION = auto()
    INT4_QUANTIZATION = auto()
    FP16_QUANTIZATION = auto()
    MAGNITUDE_PRUNING = auto()
    STRUCTURED_PRUNING = auto()
    KNOWLEDGE_DISTILLATION = auto()


@dataclass
class ModelSpec:
    """Specification of a model to be compressed.

    Attributes:
        model_id: Unique model identifier.
        parameter_count: Total number of float32 parameters.
        size_mb: Model size in megabytes.
        baseline_accuracy: Accuracy before compression.
        target_latency_ms: Target inference latency on the edge device.
    """

    model_id: str
    parameter_count: int
    size_mb: float
    baseline_accuracy: float
    target_latency_ms: float = 10.0


@dataclass
class CompressionResult:
    """Outcome of one model compression operation.

    Attributes:
        model_id: Identifier of the compressed model.
        method: Compression technique applied.
        original_size_mb: Size before compression.
        compressed_size_mb: Size after compression.
        compression_ratio: original / compressed.
        accuracy_after: Model accuracy after compression.
        accuracy_delta: Accuracy change (negative = degradation).
        estimated_latency_ms: Estimated inference latency after compression.
        meets_latency_target: Whether the latency target is met.
        compressed_at: UTC timestamp.
    """

    model_id: str
    method: CompressionMethod
    original_size_mb: float
    compressed_size_mb: float
    compression_ratio: float
    accuracy_after: float
    accuracy_delta: float
    estimated_latency_ms: float
    meets_latency_target: bool
    compressed_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc))


# Per-method simulation profile: (compression-ratio range, accuracy-penalty range).
_METHOD_PROFILES: dict[CompressionMethod, tuple[tuple[float, float], tuple[float, float]]] = {
    CompressionMethod.INT8_QUANTIZATION: ((3.5, 4.5), (0.001, 0.01)),
    CompressionMethod.INT4_QUANTIZATION: ((7.0, 9.0), (0.01, 0.05)),
    CompressionMethod.FP16_QUANTIZATION: ((1.8, 2.2), (0.0001, 0.002)),
    CompressionMethod.MAGNITUDE_PRUNING: ((2.0, 5.0), (0.005, 0.03)),
    CompressionMethod.STRUCTURED_PRUNING: ((3.0, 8.0), (0.01, 0.06)),
    CompressionMethod.KNOWLEDGE_DISTILLATION: ((4.0, 10.0), (0.005, 0.02)),
}


class ModelCompression:
    """Model quantisation and pruning simulation for edge deployment.

    Simulates compression operations, tracking compression ratio and the
    accuracy trade-off, without requiring actual model weights.

    Attributes:
        compression_history: Log of all compression results.
    """

    def __init__(self) -> None:
        """Initialise the model compression manager."""
        self.compression_history: list[CompressionResult] = []
        logger.info("ModelCompression initialised")

    def quantize(
        self,
        model_spec: ModelSpec,
        method: CompressionMethod = CompressionMethod.INT8_QUANTIZATION,
        random_seed: int = 42,
    ) -> CompressionResult:
        """Simulate model quantisation.

        Args:
            model_spec: Specification of the model to compress.
            method: Quantisation method to apply.
            random_seed: Seed for reproducible simulation.

        Returns:
            :class:`CompressionResult` with simulated metrics.

        Raises:
            ValueError: If ``method`` is not a quantisation method.
        """
        valid = {
            CompressionMethod.INT8_QUANTIZATION,
            CompressionMethod.INT4_QUANTIZATION,
            CompressionMethod.FP16_QUANTIZATION,
        }
        if method in valid:
            return self._compress(model_spec, method, random_seed)
        raise ValueError(
            f"Method {method.name} is not a quantisation method. "
            f"Use one of: {[m.name for m in valid]}"
        )

    def prune(
        self,
        model_spec: ModelSpec,
        sparsity: float = 0.5,
        structured: bool = False,
        random_seed: int = 42,
    ) -> CompressionResult:
        """Simulate model pruning.

        Args:
            model_spec: Model specification.
            sparsity: Fraction of weights to zero out (0–1).
            structured: Use structured (channel) pruning if True, else
                magnitude-based unstructured pruning.
            random_seed: Seed for reproducible simulation.

        Returns:
            :class:`CompressionResult`.

        Raises:
            ValueError: If ``sparsity`` is not in (0, 1).
        """
        if not 0 < sparsity < 1:
            raise ValueError(f"sparsity must be in (0, 1), got {sparsity}")

        if structured:
            chosen = CompressionMethod.STRUCTURED_PRUNING
        else:
            chosen = CompressionMethod.MAGNITUDE_PRUNING

        outcome = self._compress(model_spec, chosen, random_seed)
        # Higher sparsity costs extra accuracy on top of the base penalty.
        outcome.accuracy_after = round(
            max(0.0, outcome.accuracy_after - sparsity * 0.05), 4
        )
        outcome.accuracy_delta = round(
            outcome.accuracy_after - model_spec.baseline_accuracy, 4
        )
        return outcome

    def compress_pipeline(
        self,
        model_spec: ModelSpec,
        methods: list[CompressionMethod],
    ) -> list[CompressionResult]:
        """Apply a sequence of compression techniques.

        Each method is applied to the output of the previous step.

        Args:
            model_spec: Original model specification.
            methods: Ordered list of compression methods.

        Returns:
            List of :class:`CompressionResult` for each step.
        """
        results: list[CompressionResult] = []
        spec = model_spec

        for step, method in enumerate(methods):
            step_result = self._compress(spec, method, random_seed=step)
            results.append(step_result)
            # Feed the compressed model into the next step.
            spec = ModelSpec(
                model_id=spec.model_id,
                parameter_count=int(spec.parameter_count / step_result.compression_ratio),
                size_mb=step_result.compressed_size_mb,
                baseline_accuracy=step_result.accuracy_after,
                target_latency_ms=spec.target_latency_ms,
            )

        final_ratio = (
            model_spec.size_mb / results[-1].compressed_size_mb if results else 1.0
        )
        logger.info(
            "Compression pipeline for '{}': {} steps, final ratio={:.2f}×",
            model_spec.model_id,
            len(methods),
            final_ratio,
        )
        return results

    def _compress(
        self,
        model_spec: ModelSpec,
        method: CompressionMethod,
        random_seed: int,
    ) -> CompressionResult:
        """Core compression simulation.

        Args:
            model_spec: Model to compress.
            method: Compression method.
            random_seed: RNG seed.

        Returns:
            Simulated :class:`CompressionResult`.
        """
        ratio_range, penalty_range = _METHOD_PROFILES[method]
        rng = np.random.default_rng(seed=random_seed)

        # Draw order matters for seeded reproducibility: ratio, then penalty.
        ratio = float(rng.uniform(*ratio_range))
        penalty = float(rng.uniform(*penalty_range))

        size_after = model_spec.size_mb / ratio
        acc_after = max(0.0, model_spec.baseline_accuracy - penalty)
        latency = model_spec.target_latency_ms / ratio * 0.8  # heuristic

        outcome = CompressionResult(
            model_id=model_spec.model_id,
            method=method,
            original_size_mb=round(model_spec.size_mb, 2),
            compressed_size_mb=round(size_after, 2),
            compression_ratio=round(ratio, 2),
            accuracy_after=round(acc_after, 4),
            accuracy_delta=round(acc_after - model_spec.baseline_accuracy, 4),
            estimated_latency_ms=round(latency, 2),
            meets_latency_target=latency <= model_spec.target_latency_ms,
        )
        self.compression_history.append(outcome)
        logger.info(
            "Compressed '{}' with {}: ratio={:.2f}×, accuracy_delta={:+.4f}",
            model_spec.model_id,
            method.name,
            ratio,
            outcome.accuracy_delta,
        )
        return outcome
b/edgeops/orchestration/__pycache__/edge_coordinator.cpython-312.pyc differ diff --git a/edgeops/orchestration/data_sync.py b/edgeops/orchestration/data_sync.py new file mode 100644 index 0000000..536aa49 --- /dev/null +++ b/edgeops/orchestration/data_sync.py @@ -0,0 +1,307 @@ +"""Edge-to-cloud data synchronisation with conflict resolution.""" + +from __future__ import annotations + +import asyncio +import hashlib +from dataclasses import dataclass, field +from datetime import datetime, timezone +from enum import Enum, auto +from typing import Any + +from loguru import logger + + +class ConflictStrategy(Enum): + """Conflict resolution strategies for concurrent updates.""" + + LAST_WRITE_WINS = auto() # Most recent timestamp wins + SERVER_WINS = auto() # Cloud/server version always wins + CLIENT_WINS = auto() # Edge/client version always wins + MERGE = auto() # Attempt automatic field-level merge + + +@dataclass +class DataRecord: + """A versioned data record subject to synchronisation. + + Attributes: + record_id: Unique identifier. + data: Record payload. + version: Monotonically increasing version counter. + updated_at: UTC timestamp of last update. + checksum: SHA-256 checksum of serialised data. + source: ``"edge"`` or ``"cloud"``. + """ + + record_id: str + data: Any + version: int + updated_at: datetime + checksum: str + source: str = "edge" + + @classmethod + def create(cls, record_id: str, data: Any, source: str = "edge") -> "DataRecord": + """Create a new DataRecord with computed checksum. + + Args: + record_id: Record identifier. + data: Record payload. + source: Originating source. + + Returns: + New :class:`DataRecord`. + """ + checksum = hashlib.sha256(str(data).encode()).hexdigest()[:16] + return cls( + record_id=record_id, + data=data, + version=1, + updated_at=datetime.now(timezone.utc), + checksum=checksum, + source=source, + ) + + +@dataclass +class SyncResult: + """Result of a synchronisation operation. 
+ + Attributes: + synced_records: IDs of successfully synced records. + conflicts_resolved: IDs of records where conflicts were resolved. + failed_records: IDs of records that failed to sync. + bytes_transferred: Estimated bytes transferred. + duration_ms: Sync operation duration. + sync_at: UTC timestamp. + """ + + synced_records: list[str] + conflicts_resolved: list[str] + failed_records: list[str] + bytes_transferred: int + duration_ms: float + sync_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + + @property + def success_rate(self) -> float: + """Fraction of records synced successfully.""" + total = len(self.synced_records) + len(self.failed_records) + return len(self.synced_records) / total if total > 0 else 1.0 + + +class DataSync: + """Edge-to-cloud data synchronisation with conflict resolution. + + Maintains local and remote record stores, tracks sync state, + and implements configurable conflict resolution strategies. + + Attributes: + local_store: Edge-side data records keyed by record_id. + remote_store: Cloud-side data records keyed by record_id. + conflict_log: History of resolved conflicts. + sync_history: History of sync operations. + _strategy: Conflict resolution strategy. + """ + + def __init__(self, strategy: ConflictStrategy = ConflictStrategy.LAST_WRITE_WINS) -> None: + """Initialise the data sync manager. + + Args: + strategy: Conflict resolution strategy. + """ + self.local_store: dict[str, DataRecord] = {} + self.remote_store: dict[str, DataRecord] = {} + self.conflict_log: list[dict[str, Any]] = [] + self.sync_history: list[SyncResult] = [] + self._strategy = strategy + logger.info("DataSync initialised (strategy={})", strategy.name) + + def upsert_local(self, record_id: str, data: Any) -> DataRecord: + """Create or update a record in the local (edge) store. + + Args: + record_id: Record identifier. + data: Record payload. + + Returns: + Created or updated :class:`DataRecord`. 
+ """ + existing = self.local_store.get(record_id) + if existing: + checksum = hashlib.sha256(str(data).encode()).hexdigest()[:16] + record = DataRecord( + record_id=record_id, + data=data, + version=existing.version + 1, + updated_at=datetime.now(timezone.utc), + checksum=checksum, + source="edge", + ) + else: + record = DataRecord.create(record_id, data, source="edge") + self.local_store[record_id] = record + return record + + async def sync( + self, + record_ids: list[str] | None = None, + ) -> SyncResult: + """Synchronise local records to the remote store. + + Performs an incremental sync of records that differ from the + remote version. Conflicts are resolved using ``self._strategy``. + + Args: + record_ids: Subset of records to sync; syncs all if ``None``. + + Returns: + :class:`SyncResult` summarising the operation. + """ + import time + start = time.monotonic() + + targets = record_ids or list(self.local_store.keys()) + synced: list[str] = [] + conflicts: list[str] = [] + failed: list[str] = [] + bytes_tx = 0 + + for record_id in targets: + try: + local = self.local_store.get(record_id) + if local is None: + logger.debug("Record '{}' not in local store, skipping", record_id) + continue + + remote = self.remote_store.get(record_id) + resolved = self._resolve(local, remote) + + if resolved is None: + # No change needed + synced.append(record_id) + continue + + if remote and resolved.checksum != local.checksum and resolved.checksum != (remote.checksum if remote else ""): + conflicts.append(record_id) + + await asyncio.sleep(0) + self.remote_store[record_id] = resolved + bytes_tx += len(str(resolved.data).encode()) + synced.append(record_id) + + except Exception as exc: + logger.error("Sync failed for record '{}': {}", record_id, exc) + failed.append(record_id) + + duration_ms = (time.monotonic() - start) * 1000 + result = SyncResult( + synced_records=synced, + conflicts_resolved=conflicts, + failed_records=failed, + bytes_transferred=bytes_tx, + 
duration_ms=round(duration_ms, 2), + ) + self.sync_history.append(result) + logger.info( + "Sync complete: {}/{} records, {} conflicts, {} failed, {} bytes", + len(synced), + len(targets), + len(conflicts), + len(failed), + bytes_tx, + ) + return result + + async def pull(self, record_ids: list[str] | None = None) -> int: + """Pull updates from the remote store to local. + + Args: + record_ids: Records to pull; all remote records if ``None``. + + Returns: + Number of records updated locally. + """ + await asyncio.sleep(0) + targets = record_ids or list(self.remote_store.keys()) + updated = 0 + + for record_id in targets: + remote = self.remote_store.get(record_id) + if remote is None: + continue + local = self.local_store.get(record_id) + if local is None or remote.version > local.version: + self.local_store[record_id] = remote + updated += 1 + + logger.debug("Pull complete: {} records updated", updated) + return updated + + def _resolve( + self, + local: DataRecord, + remote: DataRecord | None, + ) -> DataRecord | None: + """Resolve a potential conflict between local and remote records. + + Args: + local: Local record. + remote: Remote record (may be ``None`` if first sync). + + Returns: + The record to write to remote, or ``None`` if no update needed. 
+ """ + if remote is None: + return local # New record — always push + + if local.checksum == remote.checksum: + return None # Identical — no sync needed + + # Conflict detected + self.conflict_log.append({ + "record_id": local.record_id, + "local_version": local.version, + "remote_version": remote.version, + "strategy": self._strategy.name, + "resolved_at": datetime.now(timezone.utc).isoformat(), + }) + + if self._strategy == ConflictStrategy.LAST_WRITE_WINS: + return local if local.updated_at >= remote.updated_at else remote + elif self._strategy == ConflictStrategy.SERVER_WINS: + return remote + elif self._strategy == ConflictStrategy.CLIENT_WINS: + return local + elif self._strategy == ConflictStrategy.MERGE: + return self._merge(local, remote) + + return local # Default fallback + + def _merge(self, local: DataRecord, remote: DataRecord) -> DataRecord: + """Attempt a simple field-level merge of two records. + + Merges dict payloads by taking the most-recently-updated value + for each conflicting key. + + Args: + local: Local record. + remote: Remote record. + + Returns: + Merged :class:`DataRecord`. 
def _merge(self, local: DataRecord, remote: DataRecord) -> DataRecord:
    """Field-level merge of two conflicting records.

    For dict payloads the merged payload contains the union of keys from
    both sides; where a key appears in both, the value from the
    more-recently-updated record wins. Non-dict payloads fall back to
    last-write-wins.

    Args:
        local: Local record.
        remote: Remote record.

    Returns:
        Merged :class:`DataRecord` tagged with ``source="merged"``.
    """
    local_is_newer = local.updated_at >= remote.updated_at

    if isinstance(local.data, dict) and isinstance(remote.data, dict):
        # Union of both payloads; the later dict in the literal wins on
        # conflicting keys. (The previous implementation started from
        # remote.data and only updated with local.data when local was
        # newer — so local-only keys were silently dropped whenever the
        # remote copy was newer, contradicting the documented merge.)
        if local_is_newer:
            merged_data = {**remote.data, **local.data}
        else:
            merged_data = {**local.data, **remote.data}
    else:
        # Non-dict payloads cannot be merged key-by-key.
        merged_data = local.data if local_is_newer else remote.data

    return DataRecord.create(
        local.record_id,
        merged_data,
        source="merged",
    )
@dataclass
class EdgeNode:
    """An edge node participating in the coordinator's topology.

    Attributes:
        node_id: Unique identifier.
        address: Network address (host:port).
        role: Node role in the topology.
        capacity: Normalised capacity score (0–1).
        current_load: Normalised current load (0–1).
        tags: Classification tags.
        registered_at: UTC registration timestamp.
        last_heartbeat: UTC last heartbeat timestamp.
        online: Whether the node is reachable.
    """

    node_id: str
    address: str
    role: NodeRole
    capacity: float
    current_load: float = 0.0
    tags: list[str] = field(default_factory=list)
    registered_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc))
    last_heartbeat: datetime | None = None
    online: bool = True

    @property
    def available_capacity(self) -> float:
        """Headroom left on this node, clamped to be non-negative."""
        headroom = self.capacity - self.current_load
        return headroom if headroom > 0.0 else 0.0


@dataclass
class DistributedTask:
    """A task to be distributed across edge nodes.

    Attributes:
        task_id: Unique identifier.
        task_type: Category/type label.
        payload: Task input data.
        required_capacity: Minimum available capacity needed on a node.
        affinity_tags: Preferred node tags (soft preference).
        timeout_s: Task execution deadline in seconds.
    """

    task_id: str
    task_type: str
    payload: Any
    required_capacity: float = 0.1
    affinity_tags: list[str] = field(default_factory=list)
    timeout_s: float = 30.0


@dataclass
class TaskResult:
    """Result of a distributed task execution.

    Attributes:
        task_id: Corresponding task identifier.
        node_id: Node that executed the task.
        success: Whether execution succeeded.
        result: Task output (or stringified error on failure).
        latency_ms: Execution time in milliseconds.
        executed_at: UTC timestamp.
    """

    task_id: str
    node_id: str
    success: bool
    result: Any
    latency_ms: float
    executed_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc))
def __init__(self, routing_strategy: str = "least_loaded") -> None:
    """Initialise the edge coordinator.

    Args:
        routing_strategy: ``"least_loaded"`` or ``"round_robin"``.

    Raises:
        ValueError: If ``routing_strategy`` is unknown.
    """
    valid_strategies = {"least_loaded", "round_robin"}
    if routing_strategy not in valid_strategies:
        raise ValueError(
            f"routing_strategy must be one of {valid_strategies}, got '{routing_strategy}'"
        )

    # node_id -> EdgeNode registry for the overlay network.
    self.nodes: dict[str, EdgeNode] = {}
    # Completed task results, in execution order.
    self.task_history: list[TaskResult] = []
    self._routing_strategy = routing_strategy
    self._rr_index = 0  # round-robin cursor
    logger.info("EdgeCoordinator initialised (strategy='{}')", routing_strategy)

def register_node(
    self,
    address: str,
    role: NodeRole = NodeRole.SECONDARY,
    capacity: float = 1.0,
    tags: list[str] | None = None,
) -> EdgeNode:
    """Register an edge node in the topology.

    Args:
        address: Network address string.
        role: Node role.
        capacity: Normalised capacity (0–1).
        tags: Classification tags.

    Returns:
        The registered :class:`EdgeNode`.

    Raises:
        ValueError: If ``capacity`` is not in (0, 1].
    """
    if not 0 < capacity <= 1.0:
        raise ValueError(f"capacity must be in (0, 1], got {capacity}")

    fresh = EdgeNode(
        node_id=f"node_{uuid.uuid4().hex[:8]}",
        address=address,
        role=role,
        capacity=capacity,
        tags=tags or [],
    )
    self.nodes[fresh.node_id] = fresh
    logger.info("Edge node registered: {} @ {} (role={})", fresh.node_id, address, role.name)
    return fresh
def route_task(self, task: DistributedTask) -> EdgeNode | None:
    """Pick a node for *task* according to the routing strategy.

    Candidates must be online and have enough spare capacity; when the
    task carries affinity tags, tag-matching candidates are preferred,
    but non-matching nodes are still used if no match exists.

    Args:
        task: Task requiring routing.

    Returns:
        Selected :class:`EdgeNode`, or ``None`` if no suitable node found.
    """
    def _eligible(node: EdgeNode) -> bool:
        return node.online and node.available_capacity >= task.required_capacity

    candidates = [node for node in self.nodes.values() if _eligible(node)]

    if task.affinity_tags:
        tagged = [
            node for node in candidates
            if any(tag in node.tags for tag in task.affinity_tags)
        ]
        if tagged:
            candidates = tagged

    if not candidates:
        logger.warning("No suitable nodes for task '{}' (required_capacity={})", task.task_id, task.required_capacity)
        return None

    if self._routing_strategy == "least_loaded":
        return min(candidates, key=lambda node: node.current_load)

    # round_robin: advance the cursor and wrap around the candidate list.
    chosen = candidates[self._rr_index % len(candidates)]
    self._rr_index += 1
    return chosen
async def distribute_task(
    self,
    task: DistributedTask,
    executor: Callable[[EdgeNode, DistributedTask], Awaitable[Any]] | None = None,
) -> TaskResult:
    """Route *task* to the best node and execute it there.

    The selected node's load is bumped by the task's required capacity
    for the duration of the run and restored afterwards, even on failure.

    Args:
        task: Task to distribute.
        executor: Async callable ``(node, task) → result``; a simulated
            executor is used when ``None``.

    Returns:
        :class:`TaskResult`, also appended to ``task_history``.

    Raises:
        RuntimeError: If no suitable node is available.
    """
    target = self.route_task(task)
    if target is None:
        raise RuntimeError(f"No suitable node for task '{task.task_id}'")

    import time
    started = time.monotonic()
    # Reserve capacity on the node while the task runs (clamped to 1.0).
    target.current_load = min(1.0, target.current_load + task.required_capacity)

    try:
        run = executor or self._default_executor
        outcome_data = await asyncio.wait_for(run(target, task), timeout=task.timeout_s)
        ok = True
    except Exception as exc:
        # Timeouts and executor errors both land here; the stringified
        # exception becomes the result payload.
        outcome_data = str(exc)
        ok = False
        logger.error("Task '{}' failed on node '{}': {}", task.task_id, target.node_id, exc)
    finally:
        # Release the reserved capacity regardless of outcome.
        target.current_load = max(0.0, target.current_load - task.required_capacity)

    elapsed_ms = (time.monotonic() - started) * 1000
    outcome = TaskResult(
        task_id=task.task_id,
        node_id=target.node_id,
        success=ok,
        result=outcome_data,
        latency_ms=round(elapsed_ms, 2),
    )
    self.task_history.append(outcome)
    logger.debug("Task '{}' → node '{}': {} ({:.1f}ms)", task.task_id, target.node_id, "OK" if ok else "FAIL", elapsed_ms)
    return outcome

async def broadcast(
    self,
    payload: Any,
    node_ids: list[str] | None = None,
) -> dict[str, bool]:
    """Broadcast a payload to all (or specified) online nodes.

    Args:
        payload: Data to broadcast.
            NOTE(review): the simulated sender does not actually transmit
            the payload — confirm before relying on delivery.
        node_ids: Subset of node IDs to target; all online nodes if ``None``.
            (An explicit subset is not filtered by online status.)

    Returns:
        Mapping of node_id to delivery success flag.
    """
    if node_ids:
        recipients = [self.nodes[nid] for nid in node_ids if nid in self.nodes]
    else:
        recipients = [node for node in self.nodes.values() if node.online]

    async def _deliver(node: EdgeNode) -> tuple[str, bool]:
        # Simulated delivery: yield to the loop and report success.
        await asyncio.sleep(0)
        return node.node_id, True

    delivered = await asyncio.gather(*(_deliver(node) for node in recipients))
    results = dict(delivered)
    logger.debug("Broadcast to {} nodes", len(results))
    return results
async def _default_executor(self, node: EdgeNode, task: DistributedTask) -> Any:
    """Simulated task executor used when no real executor is supplied.

    Args:
        node: Executing node.
        task: Task to execute.

    Returns:
        Simulated result string ``"result:<task_id>@<node_id>"``.
    """
    await asyncio.sleep(0)
    return f"result:{task.task_id}@{node.node_id}"

def topology_summary(self) -> dict[str, Any]:
    """Summarise the current topology.

    Returns:
        Dict with node counts, load statistics over online nodes, and
        per-role node counts (roles are counted over all nodes).
    """
    reachable = [node for node in self.nodes.values() if node.online]
    load_values = [node.current_load for node in reachable]

    role_counts = {
        role.name: sum(1 for node in self.nodes.values() if node.role == role)
        for role in NodeRole
    }

    return {
        "total_nodes": len(self.nodes),
        "online_nodes": len(reachable),
        "mean_load": round(float(np.mean(load_values)), 4) if load_values else 0.0,
        "max_load": round(float(np.max(load_values)), 4) if load_values else 0.0,
        "roles": role_counts,
    }
@dataclass
class CacheEntry:
    """A single cache entry with TTL metadata.

    Attributes:
        key: Cache key.
        value: Stored value.
        ttl_s: Time-to-live in seconds (``None`` = never expires).
        created_at: Monotonic creation timestamp.
        last_accessed_at: Monotonic last-access timestamp.
        hit_count: Number of times this entry has been read.
    """

    key: str
    value: Any
    ttl_s: float | None
    created_at: float = field(default_factory=time.monotonic)
    last_accessed_at: float = field(default_factory=time.monotonic)
    hit_count: int = 0

    @property
    def is_expired(self) -> bool:
        """Whether this entry has outlived its TTL."""
        if self.ttl_s is None:
            return False
        age = time.monotonic() - self.created_at
        return age > self.ttl_s
def __init__(
    self,
    max_size: int = 1_000,
    default_ttl_s: float | None = 300.0,
) -> None:
    """Initialise the edge cache.

    Args:
        max_size: Maximum number of cached entries.
        default_ttl_s: Default TTL in seconds (``None`` = no expiry).

    Raises:
        ValueError: If ``max_size`` < 1.
    """
    if max_size < 1:
        raise ValueError(f"max_size must be ≥1, got {max_size}")

    # OrderedDict as LRU store: least-recently-used entry sits first.
    self._store: OrderedDict[str, CacheEntry] = OrderedDict()
    self._max_size = max_size
    self._default_ttl_s = default_ttl_s
    self._hits = 0
    self._misses = 0
    self._evictions = 0
    logger.info("EdgeCache initialised (max_size={}, default_ttl={}s)", max_size, default_ttl_s)

async def get(self, key: str) -> Any | None:
    """Look up *key*, lazily evicting it when expired.

    Args:
        key: Cache key.

    Returns:
        Cached value, or ``None`` on a miss (absent or expired).
    """
    await asyncio.sleep(0)  # keep the API cooperatively async

    entry = self._store.get(key)
    if entry is None:
        self._misses += 1
        return None

    if entry.is_expired:
        # Lazy eviction: an expired entry counts as a miss.
        self._evict(key)
        self._misses += 1
        logger.debug("Cache miss (expired): '{}'", key)
        return None

    # Hit: refresh LRU position and access metadata.
    self._store.move_to_end(key)
    entry.last_accessed_at = time.monotonic()
    entry.hit_count += 1
    self._hits += 1
    logger.debug("Cache hit: '{}'", key)
    return entry.value

async def set(
    self,
    key: str,
    value: Any,
    ttl_s: float | None = ...,  # type: ignore[assignment]
) -> None:
    """Insert or overwrite *key* with *value*.

    Args:
        key: Cache key.
        value: Value to cache.
        ttl_s: TTL in seconds; the ``...`` sentinel means "use the
            cache-wide default", while ``None`` disables expiry.
    """
    await asyncio.sleep(0)

    ttl = self._default_ttl_s if ttl_s is ... else ttl_s
    fresh = CacheEntry(key=key, value=value, ttl_s=ttl)

    if key in self._store:
        # Overwrite: refresh LRU position, no eviction needed.
        self._store.move_to_end(key)
    elif len(self._store) >= self._max_size:
        # Full: drop the least-recently-used entry (front of the dict).
        self._evict(next(iter(self._store)))

    self._store[key] = fresh
    logger.debug("Cache set: '{}' (ttl={}s)", key, ttl)
async def delete(self, key: str) -> bool:
    """Remove *key* from the cache if present.

    Deliberate deletes do not count towards the eviction counter.

    Args:
        key: Cache key to remove.

    Returns:
        ``True`` if the key existed and was removed.
    """
    await asyncio.sleep(0)
    if key not in self._store:
        return False
    del self._store[key]
    logger.debug("Cache delete: '{}'", key)
    return True

async def purge_expired(self) -> int:
    """Eagerly drop every expired entry.

    Returns:
        Number of entries purged.
    """
    await asyncio.sleep(0)
    stale = [key for key, entry in self._store.items() if entry.is_expired]
    for key in stale:
        self._evict(key)
    if stale:
        logger.info("Purged {} expired cache entries", len(stale))
    return len(stale)

async def clear(self) -> int:
    """Drop every entry (hit/miss counters are left untouched).

    Returns:
        Number of entries removed.
    """
    await asyncio.sleep(0)
    removed = len(self._store)
    self._store.clear()
    logger.info("Cache cleared ({} entries removed)", removed)
    return removed

def stats(self) -> dict[str, Any]:
    """Report cache performance counters.

    Returns:
        Dict with size, hit/miss/eviction counts, and hit rate.
    """
    lookups = self._hits + self._misses
    return {
        "size": len(self._store),
        "max_size": self._max_size,
        "hits": self._hits,
        "misses": self._misses,
        "evictions": self._evictions,
        "hit_rate": round(self._hits / lookups, 4) if lookups else 0.0,
    }

def _evict(self, key: str) -> None:
    """Drop *key* (if present) and count the eviction.

    Args:
        key: Key to evict.
    """
    if key in self._store:
        del self._store[key]
        self._evictions += 1
@dataclass
class InferenceRequest:
    """A single inference request.

    Attributes:
        request_id: Unique identifier.
        payload: Input features as a numpy array.
        model_id: Target model identifier.
        priority: Request priority (higher = more urgent).
        max_latency_ms: Hard latency deadline in milliseconds.
        submitted_at: UTC submission timestamp.
    """

    request_id: str
    payload: np.ndarray
    model_id: str
    priority: int = 0
    max_latency_ms: float = 50.0
    submitted_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc))


@dataclass
class InferenceResponse:
    """Result of a completed inference request.

    Attributes:
        request_id: Corresponding request identifier.
        model_id: Model that produced the result.
        output: Inference output array (empty on timeout).
        latency_ms: Actual end-to-end latency in milliseconds.
        timed_out: Whether the request exceeded its deadline.
        completed_at: UTC completion timestamp.
    """

    request_id: str
    model_id: str
    output: np.ndarray
    latency_ms: float
    timed_out: bool = False
    completed_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc))
def __init__(self, default_timeout_ms: float = 50.0) -> None:
    """Initialise the real-time inference engine.

    Args:
        default_timeout_ms: Default request timeout in milliseconds,
            applied when a request carries no deadline of its own.
    """
    # model_id -> async backend callable.
    self.backends: dict[str, InferenceBackend] = {}
    # model_id -> recorded end-to-end latencies (ms).
    self.latency_stats: dict[str, list[float]] = {}
    # model_id -> number of deadline violations.
    self.sla_violations: dict[str, int] = {}
    self._timeout_default_ms = default_timeout_ms
    logger.info("RealTimeInference engine initialised (default_timeout={}ms)", default_timeout_ms)

def register_backend(self, model_id: str, backend: InferenceBackend) -> None:
    """Attach an inference backend and reset its bookkeeping.

    Args:
        model_id: Model identifier.
        backend: Async callable mapping a request to an output array.
    """
    self.backends[model_id] = backend
    self.latency_stats[model_id] = []
    self.sla_violations[model_id] = 0
    logger.info("Backend registered for model '{}'", model_id)
async def infer(self, request: InferenceRequest) -> InferenceResponse:
    """Run one inference request under its latency deadline.

    Args:
        request: Inference request with payload and deadline.

    Returns:
        :class:`InferenceResponse`; on timeout the output is an empty
        array and ``timed_out`` is set.

    Raises:
        KeyError: If no backend is registered for ``request.model_id``.
    """
    if request.model_id not in self.backends:
        raise KeyError(
            f"No backend registered for model '{request.model_id}'. "
            "Call register_backend() first."
        )

    backend = self.backends[request.model_id]
    # A zero/None per-request deadline falls back to the engine default.
    deadline_s = (request.max_latency_ms or self._timeout_default_ms) / 1000.0

    began = time.monotonic()
    missed_deadline = False
    result: np.ndarray

    try:
        result = await asyncio.wait_for(backend(request), timeout=deadline_s)
    except asyncio.TimeoutError:
        # Deadline blown: record the violation and return empty output.
        missed_deadline = True
        result = np.array([])
        self.sla_violations[request.model_id] += 1
        logger.warning(
            "SLA violation: request '{}' exceeded {}ms deadline",
            request.request_id,
            request.max_latency_ms,
        )

    elapsed_ms = (time.monotonic() - began) * 1000
    self.latency_stats[request.model_id].append(elapsed_ms)

    return InferenceResponse(
        request_id=request.request_id,
        model_id=request.model_id,
        output=result,
        latency_ms=round(elapsed_ms, 3),
        timed_out=missed_deadline,
    )

async def batch_infer(
    self,
    requests: list[InferenceRequest],
) -> list[InferenceResponse]:
    """Run many requests concurrently, dispatching high priority first.

    Requests are sorted globally by descending priority before dispatch;
    responses are returned in the caller's original order.

    Args:
        requests: Inference requests (may target different models).

    Returns:
        List of :class:`InferenceResponse` matching the input order.

    Raises:
        ValueError: If ``requests`` is empty.
    """
    if not requests:
        raise ValueError("requests must not be empty")

    by_priority = sorted(requests, key=lambda req: -req.priority)
    responses = await asyncio.gather(*(self.infer(req) for req in by_priority))

    # Map back to the caller's order.
    # NOTE(review): duplicate request_ids would collapse here — assumed unique.
    lookup = {resp.request_id: resp for resp in responses}
    return [lookup[req.request_id] for req in requests]
def latency_percentiles(self, model_id: str) -> dict[str, float]:
    """Compute latency percentiles for a model.

    Args:
        model_id: Model identifier.

    Returns:
        Dict with p50/p95/p99/mean/max latencies (ms), request count,
        and SLA violation count.

    Raises:
        KeyError: If the model has never been registered.
        ValueError: If no requests have been processed for it.
    """
    if model_id not in self.latency_stats:
        raise KeyError(f"No stats for model '{model_id}'")

    data = self.latency_stats[model_id]
    if not data:
        raise ValueError(f"No latency data recorded for '{model_id}'")

    arr = np.asarray(data)
    # Single vectorised call for all three percentiles.
    p50, p95, p99 = np.percentile(arr, [50, 95, 99])
    return {
        "p50_ms": round(float(p50), 3),
        "p95_ms": round(float(p95), 3),
        "p99_ms": round(float(p99), 3),
        "mean_ms": round(float(np.mean(arr)), 3),
        "max_ms": round(float(np.max(arr)), 3),
        "n_requests": len(data),
        "sla_violations": self.sla_violations.get(model_id, 0),
    }

@staticmethod
def make_simulated_backend(
    model_id: str,
    base_latency_ms: float = 2.0,
    output_shape: tuple[int, ...] = (1,),
) -> InferenceBackend:
    """Factory for a deterministic simulated inference backend.

    Args:
        model_id: Model identifier label (not used by the simulation).
        base_latency_ms: Simulated processing time.
        output_shape: Shape of the output array.

    Returns:
        Async callable suitable for :meth:`register_backend`.
    """
    import zlib  # local import: only the simulated backend needs it

    async def _backend(request: InferenceRequest) -> np.ndarray:
        await asyncio.sleep(base_latency_ms / 1000.0)
        # Seed with CRC32 of the request id. The previous code seeded
        # with built-in hash(), which is randomised per process for
        # strings (PYTHONHASHSEED), so "seeded" outputs were NOT
        # reproducible across runs; crc32 is stable everywhere.
        seed = zlib.crc32(request.request_id.encode("utf-8"))
        rng = np.random.default_rng(seed=seed)
        return rng.uniform(-1, 1, size=output_shape).astype(np.float32)

    return _backend
@dataclass
class StreamEvent:
    """A single event flowing through the stream.

    Attributes:
        event_id: Unique identifier.
        topic: Event topic/stream name.
        payload: Event data dictionary.
        timestamp: Event creation time (monotonic seconds).
        partition_key: Optional key for partitioned processing.
    """

    event_id: str
    topic: str
    payload: dict[str, Any]
    timestamp: float = field(default_factory=time.monotonic)
    partition_key: str = ""


@dataclass
class WindowResult:
    """Aggregation result over one tumbling window.

    Attributes:
        topic: Source topic.
        window_start: Window start time (monotonic).
        window_end: Window end time (monotonic).
        n_events: Number of events in the window.
        aggregations: Computed aggregation values.
    """

    topic: str
    window_start: float
    window_end: float
    n_events: int
    aggregations: dict[str, Any]


# Type aliases for the per-topic hooks.
FilterFn = Callable[[StreamEvent], bool]
AggregatorFn = Callable[[list[StreamEvent]], dict[str, Any]]
def __init__(self, window_size_s: float = 60.0, buffer_size: int = 10_000) -> None:
    """Initialise the stream processor.

    Args:
        window_size_s: Default tumbling window size in seconds.
        buffer_size: Maximum events retained per topic.
    """
    # topic -> bounded event buffer (oldest events drop off the left).
    self.topics: dict[str, deque[StreamEvent]] = {}
    # topic -> ordered filter chain.
    self._filters: dict[str, list[FilterFn]] = {}
    # topic -> window aggregation function.
    self._aggregators: dict[str, AggregatorFn] = {}
    self._window_size_s = window_size_s
    self._buffer_size = buffer_size
    self._processed_count = 0
    logger.info("StreamProcessor initialised (window={}s)", window_size_s)

def register_topic(
    self,
    topic: str,
    filter_fn: FilterFn | None = None,
    aggregator_fn: AggregatorFn | None = None,
) -> None:
    """Register a new event topic.

    Args:
        topic: Topic name.
        filter_fn: Optional filter; events for which it returns ``False``
            are discarded.
        aggregator_fn: Optional window aggregation function; a default
            count/partition aggregator is used when omitted.

    Raises:
        ValueError: If ``topic`` is already registered.
    """
    if topic in self.topics:
        raise ValueError(f"Topic '{topic}' already registered")

    self.topics[topic] = deque(maxlen=self._buffer_size)
    self._filters[topic] = [filter_fn] if filter_fn else []
    self._aggregators[topic] = aggregator_fn or self._default_aggregator
    logger.debug("Topic '{}' registered", topic)

def add_filter(self, topic: str, filter_fn: FilterFn) -> None:
    """Append a filter to an existing topic's chain.

    Args:
        topic: Target topic.
        filter_fn: Filter function to append.

    Raises:
        KeyError: If ``topic`` is not registered.
    """
    if topic not in self.topics:
        raise KeyError(f"Topic '{topic}' not registered")
    self._filters[topic].append(filter_fn)
async def process_event(self, event: StreamEvent) -> bool:
    """Run one event through its topic's filter chain and buffer it.

    Args:
        event: Incoming stream event.

    Returns:
        ``True`` if the event passed all filters and was buffered.
    """
    await asyncio.sleep(0)

    buffer = self.topics.get(event.topic)
    if buffer is None:
        logger.debug("Unknown topic '{}', dropping event", event.topic)
        return False

    for accepts in self._filters.get(event.topic, []):
        if not accepts(event):
            logger.debug("Event '{}' filtered out", event.event_id)
            return False

    buffer.append(event)
    self._processed_count += 1
    return True

async def process_batch(self, events: list[StreamEvent]) -> int:
    """Process a batch of events concurrently.

    Args:
        events: List of stream events.

    Returns:
        Number of events that passed filters.
    """
    outcomes = await asyncio.gather(*(self.process_event(e) for e in events))
    accepted = sum(outcomes)
    logger.debug("Batch: {}/{} events accepted", accepted, len(events))
    return accepted

def tumbling_window(
    self,
    topic: str,
    window_size_s: float | None = None,
) -> WindowResult:
    """Aggregate the trailing window of events for *topic*.

    Args:
        topic: Topic to aggregate.
        window_size_s: Window duration override; ``None`` (or 0) falls
            back to the processor-wide default.

    Returns:
        :class:`WindowResult` with aggregated values.

    Raises:
        KeyError: If ``topic`` is not registered.
    """
    if topic not in self.topics:
        raise KeyError(f"Topic '{topic}' not registered")

    span = window_size_s or self._window_size_s
    end = time.monotonic()
    start = end - span

    recent = [event for event in self.topics[topic] if event.timestamp >= start]

    return WindowResult(
        topic=topic,
        window_start=start,
        window_end=end,
        n_events=len(recent),
        aggregations=self._aggregators[topic](recent),
    )
+ """ + return { + "count": len(events), + "unique_partitions": len({e.partition_key for e in events}), + } + + @property + def total_processed(self) -> int: + """Total number of events processed (including filtered).""" + return self._processed_count diff --git a/llmops/__init__.py b/llmops/__init__.py new file mode 100644 index 0000000..df5eaf4 --- /dev/null +++ b/llmops/__init__.py @@ -0,0 +1,80 @@ +"""LLMOps: Operations framework for managing large language models in trading systems.""" + +from __future__ import annotations + +from loguru import logger + +from llmops.deployment.model_server import ModelServer +from llmops.deployment.ab_testing import ABTesting +from llmops.deployment.canary_deployment import CanaryDeployment +from llmops.monitoring.drift_detection import DriftDetection +from llmops.monitoring.performance_metrics import PerformanceMetrics +from llmops.monitoring.hallucination_detector import HallucinationDetector +from llmops.prompts.prompt_templates import PromptTemplates +from llmops.prompts.prompt_optimizer import PromptOptimizer +from llmops.prompts.context_injector import ContextInjector +from llmops.training.fine_tuning import FineTuning +from llmops.training.rlhf_pipeline import RLHFPipeline +from llmops.training.continual_learning import ContinualLearning + + +class LLMOps: + """Unified LLMOps orchestrator for trading platform language models. + + Aggregates training, deployment, monitoring, and prompt management + capabilities into a single operational interface. + + Attributes: + model_server: Async inference serving component. + ab_testing: A/B experiment management component. + canary: Canary rollout management component. + drift_detection: Model drift monitoring component. + performance_metrics: Model performance tracking component. + hallucination_detector: Output validation component. + prompt_templates: Reusable prompt library component. + prompt_optimizer: Automated prompt tuning component. 
def __init__(self) -> None:
    """Initialise all LLMOps sub-components.

    Construction order matches the import groups: deployment,
    monitoring, prompt management, then training.
    """
    # Deployment
    self.model_server = ModelServer()
    self.ab_testing = ABTesting()
    self.canary = CanaryDeployment()
    # Monitoring
    self.drift_detection = DriftDetection()
    self.performance_metrics = PerformanceMetrics()
    self.hallucination_detector = HallucinationDetector()
    # Prompt management
    self.prompt_templates = PromptTemplates()
    self.prompt_optimizer = PromptOptimizer()
    self.context_injector = ContextInjector()
    # Training
    self.fine_tuning = FineTuning()
    self.rlhf_pipeline = RLHFPipeline()
    self.continual_learning = ContinualLearning()
    logger.info("LLMOps initialised")
def status(self) -> dict[str, str]:
    """Return a health summary for all sub-components.

    Returns:
        Mapping of component name to status string (always ``"ready"``).
    """
    components = (
        "model_server",
        "ab_testing",
        "canary",
        "drift_detection",
        "performance_metrics",
        "hallucination_detector",
        "prompt_templates",
        "prompt_optimizer",
        "context_injector",
        "fine_tuning",
        "rlhf_pipeline",
        "continual_learning",
    )
    return {name: "ready" for name in components}
@dataclass
class Experiment:
    """Definition of one A/B test pitting a challenger model against a baseline.

    Attributes:
        experiment_id: Unique identifier.
        name: Human-readable name.
        control_model_id: Identifier of the control (baseline) model.
        treatment_model_id: Identifier of the treatment (challenger) model.
        traffic_split: Fraction of traffic routed to treatment (0-1).
        created_at: UTC creation timestamp.
        active: Whether the experiment is currently running.
        min_samples: Minimum observations before analysis is valid.
    """

    experiment_id: str
    name: str
    control_model_id: str
    treatment_model_id: str
    traffic_split: float = 0.5
    created_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc))
    active: bool = True
    min_samples: int = 100
+ """ + + experiment_id: str + control_mean: float + treatment_mean: float + relative_lift: float + p_value: float + significant: bool + confidence_level: float + n_control: int + n_treatment: int + + +class ABTesting: + """Model A/B testing with statistical significance analysis. + + Manages concurrent experiments, routes inference requests to the + appropriate model variant, and performs Welch's t-test to determine + significance. + + Attributes: + experiments: Active and completed experiments keyed by ID. + _observations: Metric observations per experiment/variant. + _rng: Seeded random generator for reproducible routing. + """ + + def __init__(self, random_seed: int = 42) -> None: + """Initialise the A/B testing framework. + + Args: + random_seed: Seed for the routing random number generator. + """ + self.experiments: dict[str, Experiment] = {} + self._observations: dict[str, dict[str, list[float]]] = {} + self._rng = np.random.default_rng(seed=random_seed) + logger.info("ABTesting initialised") + + def create_experiment( + self, + name: str, + control_model_id: str, + treatment_model_id: str, + traffic_split: float = 0.5, + min_samples: int = 100, + ) -> Experiment: + """Create and register a new A/B experiment. + + Args: + name: Human-readable experiment name. + control_model_id: Model ID for the control variant. + treatment_model_id: Model ID for the treatment variant. + traffic_split: Fraction of traffic to treatment (0–1). + min_samples: Minimum samples per arm before analysis. + + Returns: + The newly created :class:`Experiment`. + + Raises: + ValueError: If ``traffic_split`` is not in (0, 1). + ValueError: If ``control_model_id == treatment_model_id``. 
+ """ + if not 0 < traffic_split < 1: + raise ValueError(f"traffic_split must be in (0, 1), got {traffic_split}") + if control_model_id == treatment_model_id: + raise ValueError("control and treatment models must differ") + + experiment_id = str(uuid.uuid4()) + experiment = Experiment( + experiment_id=experiment_id, + name=name, + control_model_id=control_model_id, + treatment_model_id=treatment_model_id, + traffic_split=traffic_split, + min_samples=min_samples, + ) + self.experiments[experiment_id] = experiment + self._observations[experiment_id] = {"control": [], "treatment": []} + logger.info( + "Experiment '{}' created (id={}, split={:.0%} treatment)", + name, + experiment_id, + traffic_split, + ) + return experiment + + def route_request(self, experiment_id: str) -> tuple[str, str]: + """Determine which model variant should serve a request. + + Args: + experiment_id: Identifier of the experiment. + + Returns: + Tuple of ``(variant, model_id)`` where variant is either + ``"control"`` or ``"treatment"``. + + Raises: + KeyError: If ``experiment_id`` is not found. + RuntimeError: If the experiment is no longer active. + """ + experiment = self._get_active_experiment(experiment_id) + variant = ( + "treatment" + if self._rng.random() < experiment.traffic_split + else "control" + ) + model_id = ( + experiment.treatment_model_id + if variant == "treatment" + else experiment.control_model_id + ) + logger.debug("Routing request to {} ({})", variant, model_id) + return variant, model_id + + def record_observation( + self, + experiment_id: str, + variant: str, + metric_value: float, + ) -> None: + """Record a metric observation for a variant. + + Args: + experiment_id: Experiment identifier. + variant: ``"control"`` or ``"treatment"``. + metric_value: Observed metric value (e.g. latency, accuracy). + + Raises: + KeyError: If ``experiment_id`` is not found. + ValueError: If ``variant`` is not ``"control"`` or ``"treatment"``. 
+ """ + if experiment_id not in self._observations: + raise KeyError(f"Experiment '{experiment_id}' not found") + if variant not in ("control", "treatment"): + raise ValueError(f"variant must be 'control' or 'treatment', got '{variant}'") + self._observations[experiment_id][variant].append(metric_value) + + def analyze_results( + self, + experiment_id: str, + confidence_level: float = 0.95, + ) -> ExperimentResults: + """Analyse experiment results using Welch's t-test. + + Args: + experiment_id: Experiment to analyse. + confidence_level: Statistical significance threshold (e.g. 0.95). + + Returns: + :class:`ExperimentResults` with significance and lift metrics. + + Raises: + KeyError: If ``experiment_id`` is not found. + ValueError: If either arm has fewer observations than + ``experiment.min_samples``. + """ + if experiment_id not in self.experiments: + raise KeyError(f"Experiment '{experiment_id}' not found") + + experiment = self.experiments[experiment_id] + obs = self._observations[experiment_id] + ctrl = np.asarray(obs["control"], dtype=float) + trt = np.asarray(obs["treatment"], dtype=float) + + if len(ctrl) < experiment.min_samples or len(trt) < experiment.min_samples: + raise ValueError( + f"Insufficient data: control={len(ctrl)}, treatment={len(trt)}, " + f"need {experiment.min_samples} each" + ) + + ctrl_mean = float(np.mean(ctrl)) + trt_mean = float(np.mean(trt)) + relative_lift = (trt_mean - ctrl_mean) / (ctrl_mean + 1e-10) + + p_value = self._welch_t_test(ctrl, trt) + alpha = 1.0 - confidence_level + significant = p_value < alpha + + result = ExperimentResults( + experiment_id=experiment_id, + control_mean=round(ctrl_mean, 6), + treatment_mean=round(trt_mean, 6), + relative_lift=round(relative_lift, 4), + p_value=round(p_value, 6), + significant=significant, + confidence_level=confidence_level, + n_control=len(ctrl), + n_treatment=len(trt), + ) + logger.info( + "Experiment '{}' analysis: lift={:.2%}, p={:.4f}, significant={}", + experiment.name, + 
relative_lift, + p_value, + significant, + ) + return result + + def _welch_t_test(self, a: np.ndarray, b: np.ndarray) -> float: + """Compute a two-sided Welch's t-test p-value. + + Args: + a: Observations for group A. + b: Observations for group B. + + Returns: + Two-sided p-value. + """ + n_a, n_b = len(a), len(b) + mean_a, mean_b = np.mean(a), np.mean(b) + var_a = np.var(a, ddof=1) if n_a > 1 else 0.0 + var_b = np.var(b, ddof=1) if n_b > 1 else 0.0 + + se = math.sqrt(var_a / n_a + var_b / n_b + 1e-12) + t_stat = (mean_a - mean_b) / se + + # Welch–Satterthwaite degrees of freedom + num = (var_a / n_a + var_b / n_b) ** 2 + denom = (var_a / n_a) ** 2 / (n_a - 1 + 1e-12) + (var_b / n_b) ** 2 / (n_b - 1 + 1e-12) + df = num / (denom + 1e-12) + + # Approximate p-value using normal distribution for large df + z = abs(t_stat) + p_value = 2 * (1 - self._normal_cdf(z)) + return float(np.clip(p_value, 0.0, 1.0)) + + @staticmethod + def _normal_cdf(z: float) -> float: + """Standard normal CDF via the error function. + + Args: + z: Z-score. + + Returns: + Probability P(Z ≤ z). + """ + return 0.5 * (1 + math.erf(z / math.sqrt(2))) + + def _get_active_experiment(self, experiment_id: str) -> Experiment: + """Fetch an active experiment by ID. + + Args: + experiment_id: Experiment identifier. + + Returns: + The :class:`Experiment` object. + + Raises: + KeyError: If not found. + RuntimeError: If inactive. + """ + if experiment_id not in self.experiments: + raise KeyError(f"Experiment '{experiment_id}' not found") + experiment = self.experiments[experiment_id] + if not experiment.active: + raise RuntimeError(f"Experiment '{experiment_id}' is no longer active") + return experiment + + async def async_route_request(self, experiment_id: str) -> tuple[str, str]: + """Async wrapper around :meth:`route_request` for use in async pipelines. + + Args: + experiment_id: Identifier of the experiment. + + Returns: + Tuple of ``(variant, model_id)``. 
+ """ + return await asyncio.get_event_loop().run_in_executor( + None, self.route_request, experiment_id + ) + + async def async_analyze_results( + self, + experiment_id: str, + confidence_level: float = 0.95, + ) -> ExperimentResults: + """Async wrapper around :meth:`analyze_results` for use in async pipelines. + + Args: + experiment_id: Experiment to analyse. + confidence_level: Statistical significance threshold. + + Returns: + :class:`ExperimentResults` with significance and lift metrics. + """ + return await asyncio.get_event_loop().run_in_executor( + None, self.analyze_results, experiment_id, confidence_level + ) + + def stop_experiment(self, experiment_id: str) -> None: + """Mark an experiment as inactive. + + Args: + experiment_id: Experiment to stop. + + Raises: + KeyError: If not found. + """ + if experiment_id not in self.experiments: + raise KeyError(f"Experiment '{experiment_id}' not found") + self.experiments[experiment_id].active = False + logger.info("Experiment '{}' stopped", experiment_id) diff --git a/llmops/deployment/canary_deployment.py b/llmops/deployment/canary_deployment.py new file mode 100644 index 0000000..9ea0ffc --- /dev/null +++ b/llmops/deployment/canary_deployment.py @@ -0,0 +1,289 @@ +"""Canary deployment manager for safe LLM rollouts.""" + +from __future__ import annotations + +import asyncio +from dataclasses import dataclass, field +from datetime import datetime, timezone +from enum import Enum, auto +from typing import Any + +import numpy as np +from loguru import logger + + +class DeploymentState(Enum): + """Lifecycle states of a canary deployment.""" + + PENDING = auto() + CANARY = auto() + PROMOTING = auto() + STABLE = auto() + ROLLING_BACK = auto() + ROLLED_BACK = auto() + FAILED = auto() + + +@dataclass +class CanaryConfig: + """Configuration for a canary deployment. + + Attributes: + deployment_id: Unique identifier for the deployment. + model_id: Identifier of the new model version being deployed. 
@dataclass
class CanaryMetrics:
    """Point-in-time telemetry snapshot for a running canary.

    Attributes:
        deployment_id: Owning deployment identifier.
        error_rate: Fraction of requests that errored.
        p50_latency_ms: 50th percentile latency.
        p99_latency_ms: 99th percentile latency.
        requests_served: Total requests handled by the canary.
        timestamp: UTC time of the snapshot.
    """

    deployment_id: str
    error_rate: float
    p50_latency_ms: float
    p99_latency_ms: float
    requests_served: int
    timestamp: datetime = field(default_factory=lambda: datetime.now(timezone.utc))
+ """ + + def __init__(self) -> None: + """Initialise the canary deployment manager.""" + self.deployments: dict[str, CanaryConfig] = {} + self._metrics_history: dict[str, list[CanaryMetrics]] = {} + self._states: dict[str, DeploymentState] = {} + logger.info("CanaryDeployment manager initialised") + + def deploy_canary(self, config: CanaryConfig) -> str: + """Register and activate a new canary deployment. + + Args: + config: Canary deployment configuration. + + Returns: + Deployment identifier. + + Raises: + ValueError: If traffic percentages are out of range. + ValueError: If a deployment with the same ID already exists. + """ + if not 0 < config.initial_traffic_pct < 100: + raise ValueError( + f"initial_traffic_pct must be in (0, 100), got {config.initial_traffic_pct}" + ) + if config.initial_traffic_pct > config.max_traffic_pct: + raise ValueError( + "initial_traffic_pct must not exceed max_traffic_pct" + ) + if config.deployment_id in self.deployments: + raise ValueError(f"Deployment '{config.deployment_id}' already exists") + + self.deployments[config.deployment_id] = config + self._metrics_history[config.deployment_id] = [] + self._states[config.deployment_id] = DeploymentState.CANARY + + logger.info( + "Canary deployed: model='{}' at {:.0f}% traffic (id={})", + config.model_id, + config.initial_traffic_pct, + config.deployment_id, + ) + return config.deployment_id + + async def monitor_metrics( + self, + deployment_id: str, + n_samples: int = 50, + ) -> CanaryMetrics: + """Collect and record a metrics snapshot for the canary. + + In production this would query observability infrastructure; here + it simulates realistic telemetry. + + Args: + deployment_id: Deployment to monitor. + n_samples: Number of synthetic request samples to simulate. + + Returns: + Current :class:`CanaryMetrics` snapshot. + + Raises: + KeyError: If ``deployment_id`` is not found. 
+ """ + if deployment_id not in self.deployments: + raise KeyError(f"Deployment '{deployment_id}' not found") + + await asyncio.sleep(0) + rng = np.random.default_rng(seed=int(datetime.now(timezone.utc).timestamp()) % (2**16)) + + latencies = rng.lognormal(mean=4.5, sigma=0.5, size=n_samples) # ~ms + errors = rng.binomial(1, 0.01, size=n_samples) + + metrics = CanaryMetrics( + deployment_id=deployment_id, + error_rate=round(float(errors.mean()), 4), + p50_latency_ms=round(float(np.percentile(latencies, 50)), 2), + p99_latency_ms=round(float(np.percentile(latencies, 99)), 2), + requests_served=n_samples, + ) + self._metrics_history[deployment_id].append(metrics) + logger.debug( + "Canary metrics: err={:.2%}, p50={:.1f}ms, p99={:.1f}ms", + metrics.error_rate, + metrics.p50_latency_ms, + metrics.p99_latency_ms, + ) + return metrics + + async def promote(self, deployment_id: str) -> bool: + """Promote the canary to 100% traffic. + + Checks that recent metrics are within thresholds before promoting. + + Args: + deployment_id: Deployment to promote. + + Returns: + ``True`` if promotion succeeded, ``False`` if blocked by metrics. + + Raises: + KeyError: If ``deployment_id`` is not found. + RuntimeError: If the deployment is not in CANARY state. + """ + config = self._get_deployment(deployment_id, expected_state=DeploymentState.CANARY) + + metrics = await self.monitor_metrics(deployment_id) + if not self._metrics_healthy(metrics, config): + logger.warning( + "Promotion blocked for '{}': metrics unhealthy (err={:.2%}, p99={:.1f}ms)", + deployment_id, + metrics.error_rate, + metrics.p99_latency_ms, + ) + return False + + self._states[deployment_id] = DeploymentState.STABLE + logger.info( + "Canary '{}' promoted to stable (model='{}')", + deployment_id, + config.model_id, + ) + return True + + async def rollback(self, deployment_id: str, reason: str = "manual") -> None: + """Roll back the canary to the baseline model. + + Args: + deployment_id: Deployment to roll back. 
+ reason: Human-readable rollback reason for audit logging. + + Raises: + KeyError: If ``deployment_id`` is not found. + """ + if deployment_id not in self.deployments: + raise KeyError(f"Deployment '{deployment_id}' not found") + + config = self.deployments[deployment_id] + self._states[deployment_id] = DeploymentState.ROLLED_BACK + await asyncio.sleep(0) + logger.warning( + "Canary '{}' rolled back to '{}': {}", + deployment_id, + config.baseline_model_id, + reason, + ) + + def get_state(self, deployment_id: str) -> DeploymentState: + """Return the current state of a deployment. + + Args: + deployment_id: Deployment identifier. + + Returns: + Current :class:`DeploymentState`. + + Raises: + KeyError: If ``deployment_id`` is not found. + """ + if deployment_id not in self._states: + raise KeyError(f"Deployment '{deployment_id}' not found") + return self._states[deployment_id] + + def _metrics_healthy(self, metrics: CanaryMetrics, config: CanaryConfig) -> bool: + """Check whether canary metrics satisfy health thresholds. + + Args: + metrics: Current telemetry snapshot. + config: Deployment configuration with threshold values. + + Returns: + ``True`` if all thresholds are satisfied. + """ + return ( + metrics.error_rate <= config.error_rate_threshold + and metrics.p99_latency_ms <= config.latency_threshold_ms + ) + + def _get_deployment( + self, + deployment_id: str, + expected_state: DeploymentState | None = None, + ) -> CanaryConfig: + """Retrieve a deployment, optionally asserting its state. + + Args: + deployment_id: Deployment identifier. + expected_state: If set, raises if current state differs. + + Returns: + The :class:`CanaryConfig`. + + Raises: + KeyError: If not found. + RuntimeError: If state assertion fails. 
+ """ + if deployment_id not in self.deployments: + raise KeyError(f"Deployment '{deployment_id}' not found") + if expected_state is not None: + current = self._states[deployment_id] + if current != expected_state: + raise RuntimeError( + f"Deployment '{deployment_id}' is in state {current.name}, " + f"expected {expected_state.name}" + ) + return self.deployments[deployment_id] diff --git a/llmops/deployment/model_server.py b/llmops/deployment/model_server.py new file mode 100644 index 0000000..3f8af84 --- /dev/null +++ b/llmops/deployment/model_server.py @@ -0,0 +1,255 @@ +"""Async model server for LLM inference serving.""" + +from __future__ import annotations + +import asyncio +import time +from dataclasses import dataclass, field +from typing import Any + +import numpy as np +from loguru import logger + + +@dataclass +class ModelConfig: + """Configuration for a served model. + + Attributes: + model_id: Unique identifier for the model. + model_path: File path or URI of the model artefact. + max_batch_size: Maximum number of requests in a single batch. + timeout_seconds: Per-request inference timeout. + max_sequence_length: Maximum token length accepted. + """ + + model_id: str + model_path: str + max_batch_size: int = 32 + timeout_seconds: float = 5.0 + max_sequence_length: int = 2048 + + +@dataclass +class PredictResult: + """Inference result from a single prediction. + + Attributes: + model_id: Identifier of the model that produced the output. + output: Generated text or structured output. + latency_ms: Wall-clock inference latency in milliseconds. + tokens_generated: Number of output tokens produced. + confidence: Optional confidence score. + """ + + model_id: str + output: str + latency_ms: float + tokens_generated: int + confidence: float = 1.0 + + +@dataclass +class HealthStatus: + """Health check response for the model server. + + Attributes: + healthy: Overall health flag. + model_loaded: Whether a model is currently loaded. 
class ModelServer:
    """Async inference server for LLM models.

    Supports single-request and batch prediction, health-checking, and
    model hot-swapping. The default implementation simulates inference
    without requiring an actual model runtime.

    Attributes:
        config: Currently loaded model configuration.
        _loaded: Whether a model is currently ready for inference.
        _start_time: Server start timestamp (monotonic).
        _requests_served: Counter of completed requests.
        _error_count: Counter of failed requests.
    """

    def __init__(self) -> None:
        """Initialise the model server in an unloaded state."""
        self.config: ModelConfig | None = None
        self._loaded: bool = False
        self._start_time: float = time.monotonic()
        self._requests_served: int = 0
        self._error_count: int = 0
        logger.info("ModelServer initialised")

    async def load_model(self, config: ModelConfig) -> None:
        """Load a model into the server.

        Args:
            config: Model configuration specifying the artefact path and
                serving parameters.

        Raises:
            RuntimeError: If a model is already loaded; call ``unload_model``
                first.
        """
        if self._loaded:
            raise RuntimeError(
                f"Model '{self.config.model_id}' already loaded. "  # type: ignore[union-attr]
                "Call unload_model() first."
            )
        logger.info("Loading model '{}' from '{}'", config.model_id, config.model_path)
        await asyncio.sleep(0)  # Simulate I/O loading
        self.config = config
        self._loaded = True
        logger.info("Model '{}' loaded successfully", config.model_id)

    async def unload_model(self) -> None:
        """Unload the current model and free resources."""
        if not self._loaded or self.config is None:
            logger.warning("No model is currently loaded")
            return
        logger.info("Unloading model '{}'", self.config.model_id)
        await asyncio.sleep(0)
        self.config = None
        self._loaded = False

    async def predict(
        self,
        prompt: str,
        max_tokens: int = 256,
        temperature: float = 0.7,
    ) -> PredictResult:
        """Run inference on a single prompt.

        Args:
            prompt: Input text to the model.
            max_tokens: Maximum number of tokens to generate.
            temperature: Sampling temperature (0 = greedy, higher = more random).

        Returns:
            Inference result with generated text and latency.

        Raises:
            RuntimeError: If no model is loaded.
            asyncio.TimeoutError: If inference exceeds the configured timeout.
        """
        if not self._loaded or self.config is None:
            self._error_count += 1
            raise RuntimeError("No model loaded. Call load_model() first.")

        start = time.monotonic()
        try:
            result = await asyncio.wait_for(
                self._run_inference(prompt, max_tokens, temperature),
                timeout=self.config.timeout_seconds,
            )
        except asyncio.TimeoutError:
            self._error_count += 1
            raise
        else:
            self._requests_served += 1
            latency_ms = (time.monotonic() - start) * 1000
            result.latency_ms = round(latency_ms, 2)
            return result

    async def _run_inference(
        self,
        prompt: str,
        max_tokens: int,
        temperature: float,
    ) -> PredictResult:
        """Simulate model inference.

        Args:
            prompt: Input text.
            max_tokens: Output length budget.
            temperature: Sampling temperature.

        Returns:
            Simulated prediction result.
        """
        import zlib  # local import: only the simulated backend needs it

        await asyncio.sleep(0)
        # crc32 gives a seed that is stable across processes, unlike the
        # salted builtin hash(), so simulated runs are reproducible.
        rng = np.random.default_rng(seed=zlib.crc32(prompt.encode("utf-8")))
        # Clamp the sampling range: rng.integers(low, high) requires
        # low < high, so max_tokens <= 10 previously raised ValueError.
        cap = min(max_tokens, 200)
        tokens_generated = int(rng.integers(10, cap)) if cap > 10 else max(1, cap)
        simulated_output = (
            f"[{self.config.model_id}] Analysis of '{prompt[:40]}...': "
            f"Simulated response with {tokens_generated} tokens."
        )
        confidence = float(rng.uniform(0.7, 0.99))

        return PredictResult(
            model_id=self.config.model_id,  # type: ignore[union-attr]
            output=simulated_output,
            latency_ms=0.0,  # filled by caller
            tokens_generated=tokens_generated,
            confidence=round(confidence, 4),
        )

    async def batch_predict(
        self,
        prompts: list[str],
        max_tokens: int = 256,
        temperature: float = 0.7,
    ) -> list[PredictResult]:
        """Run inference on a batch of prompts.

        Prompts are processed concurrently up to ``config.max_batch_size``.

        Args:
            prompts: List of input prompts.
            max_tokens: Maximum tokens per output.
            temperature: Sampling temperature.

        Returns:
            List of inference results in the same order as ``prompts``.

        Raises:
            RuntimeError: If no model is loaded.
            ValueError: If ``prompts`` is empty.
        """
        if not prompts:
            raise ValueError("prompts must not be empty")
        if not self._loaded or self.config is None:
            raise RuntimeError("No model loaded. Call load_model() first.")

        max_batch = self.config.max_batch_size
        results: list[PredictResult] = []

        for batch_start in range(0, len(prompts), max_batch):
            batch = prompts[batch_start: batch_start + max_batch]
            batch_results = await asyncio.gather(
                *[self.predict(p, max_tokens, temperature) for p in batch]
            )
            results.extend(batch_results)

        logger.debug("Batch predict: {} prompts, {} results", len(prompts), len(results))
        return results

    async def health_check(self) -> HealthStatus:
        """Return the current health status of the server.

        Returns:
            :class:`HealthStatus` snapshot.
        """
        await asyncio.sleep(0)
        uptime = time.monotonic() - self._start_time
        total = self._requests_served + self._error_count
        error_rate = self._error_count / total if total > 0 else 0.0

        status = HealthStatus(
            healthy=self._loaded,
            model_loaded=self._loaded,
            uptime_seconds=round(uptime, 2),
            requests_served=self._requests_served,
            error_rate=round(error_rate, 4),
        )
        return status
@dataclass
class DriftReport:
    """Result record produced by one drift-detection evaluation.

    Attributes:
        feature_name: Name of the feature that was evaluated.
        method: Statistical method used (``"psi"`` or ``"ks"``).
        statistic: Test statistic value.
        threshold: Threshold above which drift is declared.
        drift_detected: Whether drift was declared.
        severity: Categorical severity label.
        evaluated_at: UTC timestamp of evaluation.
    """

    feature_name: str
    method: str
    statistic: float
    threshold: float
    drift_detected: bool
    severity: str
    evaluated_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc))
+ """ + self.reference_distributions: dict[str, np.ndarray] = {} + self.drift_history: list[DriftReport] = [] + self._psi_threshold = psi_threshold + self._ks_threshold = ks_pvalue_threshold + logger.info( + "DriftDetection initialised (psi_threshold={}, ks_pvalue_threshold={})", + psi_threshold, + ks_pvalue_threshold, + ) + + def set_reference(self, feature_name: str, data: np.ndarray) -> None: + """Store a reference distribution for a feature. + + Args: + feature_name: Feature identifier. + data: 1-D array of reference observations. + + Raises: + ValueError: If ``data`` is not 1-D or has fewer than 30 samples. + """ + data = np.asarray(data, dtype=float).ravel() + if data.ndim != 1: + raise ValueError("data must be 1-D") + if len(data) < 30: + raise ValueError(f"Reference requires ≥30 samples, got {len(data)}") + self.reference_distributions[feature_name] = data + logger.info("Reference distribution set for feature '{}' ({} samples)", feature_name, len(data)) + + def compute_psi( + self, + feature_name: str, + current_data: np.ndarray, + n_bins: int = 10, + ) -> DriftReport: + """Compute PSI between the reference and current distributions. + + Args: + feature_name: Feature to evaluate (must have a reference set). + current_data: 1-D array of current observations. + n_bins: Number of histogram buckets. + + Returns: + :class:`DriftReport` with PSI result. + + Raises: + KeyError: If no reference distribution exists for ``feature_name``. + ValueError: If ``current_data`` has fewer than 10 samples. 
+ """ + reference = self._get_reference(feature_name) + current_data = np.asarray(current_data, dtype=float).ravel() + if len(current_data) < 10: + raise ValueError(f"current_data requires ≥10 samples, got {len(current_data)}") + + psi = self._psi(reference, current_data, n_bins) + severity = self._psi_severity(psi) + drift_detected = psi >= self._psi_threshold + + report = DriftReport( + feature_name=feature_name, + method="psi", + statistic=round(psi, 6), + threshold=self._psi_threshold, + drift_detected=drift_detected, + severity=severity, + ) + self.drift_history.append(report) + log = logger.warning if drift_detected else logger.debug + log( + "PSI for '{}': {:.4f} ({}) — drift={}", + feature_name, + psi, + severity, + drift_detected, + ) + return report + + def compute_ks( + self, + feature_name: str, + current_data: np.ndarray, + ) -> DriftReport: + """Compute KS two-sample test between reference and current data. + + Args: + feature_name: Feature to evaluate (must have a reference set). + current_data: 1-D array of current observations. + + Returns: + :class:`DriftReport` with KS statistic and approximate p-value. + + Raises: + KeyError: If no reference distribution exists for ``feature_name``. 
+ """ + reference = self._get_reference(feature_name) + current_data = np.asarray(current_data, dtype=float).ravel() + + ks_stat, p_value = self._ks_two_sample(reference, current_data) + drift_detected = p_value < self._ks_threshold + severity = "significant" if drift_detected else "none" + + report = DriftReport( + feature_name=feature_name, + method="ks", + statistic=round(ks_stat, 6), + threshold=self._ks_threshold, + drift_detected=drift_detected, + severity=severity, + ) + self.drift_history.append(report) + log = logger.warning if drift_detected else logger.debug + log( + "KS for '{}': stat={:.4f}, p={:.4f} — drift={}", + feature_name, + ks_stat, + p_value, + drift_detected, + ) + return report + + def evaluate_all(self, current_data: dict[str, np.ndarray]) -> dict[str, DriftReport]: + """Run PSI drift evaluation on all features with stored references. + + Args: + current_data: Mapping of feature name to current observations. + + Returns: + Mapping of feature name to :class:`DriftReport`. + """ + results: dict[str, DriftReport] = {} + for feature_name, data in current_data.items(): + if feature_name in self.reference_distributions: + results[feature_name] = self.compute_psi(feature_name, data) + else: + logger.warning("No reference for feature '{}', skipping", feature_name) + return results + + def _psi(self, reference: np.ndarray, current: np.ndarray, n_bins: int) -> float: + """Calculate Population Stability Index. + + Args: + reference: Reference distribution. + current: Current distribution. + n_bins: Number of histogram bins. + + Returns: + PSI value. 
+ """ + eps = 1e-8 + bin_edges = np.percentile(reference, np.linspace(0, 100, n_bins + 1)) + bin_edges = np.unique(bin_edges) + if len(bin_edges) < 2: + return 0.0 + + ref_counts = np.histogram(reference, bins=bin_edges)[0].astype(float) + cur_counts = np.histogram(current, bins=bin_edges)[0].astype(float) + + ref_pct = ref_counts / (ref_counts.sum() + eps) + cur_pct = cur_counts / (cur_counts.sum() + eps) + psi = float(np.sum((cur_pct - ref_pct) * np.log((cur_pct + eps) / (ref_pct + eps)))) + return abs(psi) + + def _ks_two_sample( + self, a: np.ndarray, b: np.ndarray + ) -> tuple[float, float]: + """Compute KS statistic and approximate p-value. + + Args: + a: First sample. + b: Second sample. + + Returns: + Tuple of ``(ks_statistic, p_value)``. + """ + a_sorted = np.sort(a) + b_sorted = np.sort(b) + combined = np.concatenate([a_sorted, b_sorted]) + combined = np.unique(combined) + + cdf_a = np.searchsorted(a_sorted, combined, side="right") / len(a_sorted) + cdf_b = np.searchsorted(b_sorted, combined, side="right") / len(b_sorted) + + ks_stat = float(np.max(np.abs(cdf_a - cdf_b))) + + # Kolmogorov approximation for p-value + n = len(a) * len(b) / (len(a) + len(b)) + lambda_val = (math.sqrt(n) + 0.12 + 0.11 / math.sqrt(n)) * ks_stat + p_value = float(2 * sum( + ((-1) ** (k - 1)) * math.exp(-2 * k * k * lambda_val ** 2) + for k in range(1, 20) + )) + p_value = float(np.clip(p_value, 0.0, 1.0)) + return ks_stat, p_value + + def _psi_severity(self, psi: float) -> str: + """Categorise PSI value into a severity label. + + Args: + psi: PSI score. + + Returns: + ``"none"``, ``"minor"``, or ``"significant"``. + """ + if psi < self.PSI_MINOR: + return "none" + if psi < self.PSI_SIGNIFICANT: + return "minor" + return "significant" + + def _get_reference(self, feature_name: str) -> np.ndarray: + """Retrieve a stored reference distribution. + + Args: + feature_name: Feature identifier. + + Returns: + Reference data array. 
@dataclass
class HallucinationReport:
    """Result of a hallucination detection evaluation.

    Attributes:
        output_id: Identifier for the evaluated output.
        is_hallucination: Whether a hallucination was detected.
        confidence_score: Model's self-reported confidence (0–1).
        consistency_score: Internal consistency across multiple samples (0–1).
        factual_score: Factual grounding score (0–1).
        risk_level: Categorical risk (``"low"``, ``"medium"``, ``"high"``).
        flags: Specific issues detected.
        evaluated_at: UTC timestamp.
    """

    output_id: str
    is_hallucination: bool
    confidence_score: float
    consistency_score: float
    factual_score: float
    risk_level: str
    flags: list[str] = field(default_factory=list)
    evaluated_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc))


# Patterns that correlate with low-confidence or hallucinated responses
_UNCERTAINTY_PATTERNS: list[str] = [
    r"\bi (think|believe|suppose|assume)\b",
    r"\b(probably|possibly|perhaps|maybe|might be|could be)\b",
    r"\bi('m| am) not (sure|certain|confident)\b",
    r"\b(i|we) cannot (confirm|verify|guarantee)\b",
    r"\bapproximately\b",
]

_CONTRADICTION_MARKERS: list[str] = [
    r"\bhowever\b.*\bbut\b",
    r"\bon the other hand\b",
    r"\bcontradicts?\b",
]


class HallucinationDetector:
    """LLM output validation using consistency checks and confidence scoring.

    Combines three complementary signals:
    1. **Confidence scoring**: Linguistic uncertainty patterns in the output.
    2. **Consistency checking**: Agreement across multiple sampled outputs.
    3. **Factual grounding**: Overlap with provided ground-truth context.

    Attributes:
        detection_history: All past detection reports.
        _confidence_threshold: Minimum confidence before flagging.
        _consistency_threshold: Minimum consistency score before flagging.
        _factual_threshold: Minimum factual overlap before flagging.
    """

    def __init__(
        self,
        confidence_threshold: float = 0.6,
        consistency_threshold: float = 0.7,
        factual_threshold: float = 0.5,
    ) -> None:
        """Initialise the hallucination detector.

        Args:
            confidence_threshold: Outputs below this confidence are flagged.
            consistency_threshold: Outputs below this consistency are flagged.
            factual_threshold: Outputs below this factual overlap are flagged.
        """
        self.detection_history: list[HallucinationReport] = []
        self._confidence_threshold = confidence_threshold
        self._consistency_threshold = consistency_threshold
        self._factual_threshold = factual_threshold
        # Pre-compile once; these are consulted on every detect() call.
        self._uncertainty_re = [
            re.compile(pattern, re.IGNORECASE) for pattern in _UNCERTAINTY_PATTERNS
        ]
        self._contradiction_re = [
            re.compile(pattern, re.IGNORECASE) for pattern in _CONTRADICTION_MARKERS
        ]
        logger.info(
            "HallucinationDetector initialised (conf={}, consist={}, fact={})",
            confidence_threshold,
            consistency_threshold,
            factual_threshold,
        )

    def detect(
        self,
        output: str,
        output_id: str | None = None,
        context: str | None = None,
        sampled_outputs: list[str] | None = None,
    ) -> HallucinationReport:
        """Evaluate a single LLM output for hallucination signals.

        Args:
            output: The LLM-generated text to evaluate.
            output_id: Optional identifier (auto-generated if ``None``).
            context: Optional ground-truth or retrieval context for factual
                grounding check.
            sampled_outputs: Optional list of alternative outputs sampled at
                higher temperature for consistency checking.

        Returns:
            :class:`HallucinationReport` with all scoring results.

        Raises:
            ValueError: If ``output`` is empty.
        """
        if not output.strip():
            raise ValueError("output must not be empty")

        oid = output_id or f"output_{len(self.detection_history)}"
        detected_flags: list[str] = []

        conf = self._score_confidence(output, detected_flags)
        consist = self._score_consistency(output, sampled_outputs, detected_flags)
        fact = self._score_factual(output, context, detected_flags)

        # Any single sub-score below its threshold is enough to flag.
        is_hallucination = any((
            conf < self._confidence_threshold,
            consist < self._consistency_threshold,
            fact < self._factual_threshold,
        ))
        risk_level = self._compute_risk(conf, consist, fact)

        report = HallucinationReport(
            output_id=oid,
            is_hallucination=is_hallucination,
            confidence_score=round(conf, 4),
            consistency_score=round(consist, 4),
            factual_score=round(fact, 4),
            risk_level=risk_level,
            flags=detected_flags,
        )
        self.detection_history.append(report)

        if is_hallucination:
            logger.warning(
                "Hallucination detected (id={}) — risk={}, flags={}",
                oid,
                risk_level,
                detected_flags,
            )
        else:
            logger.debug("Output '{}' passed hallucination checks (risk={})", oid, risk_level)

        return report

    def batch_detect(
        self,
        outputs: list[str],
        context: str | None = None,
    ) -> list[HallucinationReport]:
        """Evaluate a batch of outputs.

        Args:
            outputs: List of LLM-generated texts.
            context: Shared context for factual grounding checks.

        Returns:
            List of :class:`HallucinationReport` in the same order.
        """
        reports: list[HallucinationReport] = []
        for idx, text in enumerate(outputs):
            reports.append(self.detect(text, output_id=f"output_{idx}", context=context))
        return reports

    def _score_confidence(self, output: str, flags: list[str]) -> float:
        """Estimate output confidence from linguistic uncertainty patterns.

        Args:
            output: Model output text.
            flags: Mutable list to append detected flag descriptions.

        Returns:
            Confidence score in [0, 1] (higher is better).
        """
        all_patterns = list(self._uncertainty_re) + list(self._contradiction_re)
        total_hits = sum(1 for rx in all_patterns if rx.search(output))
        if total_hits > 0:
            flags.append(f"uncertainty_patterns:{total_hits}")

        # Each matching pattern knocks 0.15 off the score, floored at zero.
        return float(max(0.0, 1.0 - 0.15 * total_hits))

    def _score_consistency(
        self,
        output: str,
        sampled_outputs: list[str] | None,
        flags: list[str],
    ) -> float:
        """Measure consistency of an output against sampled alternatives.

        Uses normalised word-level Jaccard similarity.

        Args:
            output: Primary model output.
            sampled_outputs: Alternative sampled outputs (optional).
            flags: Mutable list to append flag descriptions.

        Returns:
            Consistency score in [0, 1].
        """
        if not sampled_outputs:
            return 1.0  # Cannot assess — default to passing

        base_words = set(output.lower().split())

        def jaccard(alternative: str) -> float:
            alt_words = set(alternative.lower().split())
            union = base_words | alt_words
            return len(base_words & alt_words) / len(union) if union else 0.0

        mean_sim = float(np.mean([jaccard(alt) for alt in sampled_outputs]))
        if mean_sim < self._consistency_threshold:
            flags.append(f"low_consistency:{mean_sim:.2f}")

        return mean_sim

    def _score_factual(
        self,
        output: str,
        context: str | None,
        flags: list[str],
    ) -> float:
        """Measure factual overlap between output and provided context.

        Args:
            output: Model output text.
            context: Ground-truth or retrieval context.
            flags: Mutable list to append flag descriptions.

        Returns:
            Factual grounding score in [0, 1].
        """
        if not context:
            return 1.0  # Cannot assess — default to passing

        output_words = set(output.lower().split())
        if not output_words:
            return 0.0

        overlap = len(output_words & set(context.lower().split())) / len(output_words)
        if overlap < self._factual_threshold:
            flags.append(f"low_factual_overlap:{overlap:.2f}")

        return float(overlap)

    def _compute_risk(
        self,
        confidence: float,
        consistency: float,
        factual: float,
    ) -> str:
        """Derive a categorical risk level from the three sub-scores.

        Args:
            confidence: Confidence score.
            consistency: Consistency score.
            factual: Factual score.

        Returns:
            ``"low"``, ``"medium"``, or ``"high"``.
        """
        avg = (confidence + consistency + factual) / 3.0
        if avg >= 0.75:
            return "low"
        return "medium" if avg >= 0.5 else "high"
class PerformanceMetrics:
    """Track and compute model performance metrics over time.

    Accumulates per-prediction labels and scores to compute standard
    classification metrics, and retains a time-series history of
    :class:`MetricSnapshot` objects for trend analysis.

    Attributes:
        history: Ordered list of metric snapshots.
        _y_true: Accumulated ground-truth labels.
        _y_pred: Accumulated predicted labels.
        _y_scores: Accumulated probability scores for AUC computation.
    """

    def __init__(self) -> None:
        """Initialise the performance metrics tracker."""
        self.history: list[MetricSnapshot] = []
        self._y_true: list[int] = []
        self._y_pred: list[int] = []
        self._y_scores: list[float] = []
        logger.info("PerformanceMetrics initialised")

    def record_prediction(
        self,
        y_true: int,
        y_pred: int,
        y_score: float | None = None,
    ) -> None:
        """Record a single prediction for metric accumulation.

        Args:
            y_true: Ground-truth label (0 or 1).
            y_pred: Predicted label (0 or 1).
            y_score: Optional probability score for the positive class (0–1).

        Raises:
            ValueError: If labels are not 0 or 1, or if score is outside [0, 1].
        """
        if y_true not in (0, 1):
            raise ValueError(f"y_true must be 0 or 1, got {y_true}")
        if y_pred not in (0, 1):
            raise ValueError(f"y_pred must be 0 or 1, got {y_pred}")
        if y_score is not None and not 0.0 <= y_score <= 1.0:
            raise ValueError(f"y_score must be in [0, 1], got {y_score}")

        self._y_true.append(y_true)
        self._y_pred.append(y_pred)
        # Fall back to the hard label as a degenerate score so AUC stays defined.
        self._y_scores.append(y_score if y_score is not None else float(y_pred))

    def record_batch(
        self,
        y_true: list[int],
        y_pred: list[int],
        y_scores: list[float] | None = None,
    ) -> None:
        """Record a batch of predictions.

        Args:
            y_true: List of ground-truth labels.
            y_pred: List of predicted labels.
            y_scores: Optional list of probability scores.

        Raises:
            ValueError: If lengths of input lists do not match.
        """
        if len(y_true) != len(y_pred):
            raise ValueError(
                f"Length mismatch: y_true={len(y_true)}, y_pred={len(y_pred)}"
            )
        if y_scores is not None and len(y_scores) != len(y_true):
            raise ValueError(
                f"Length mismatch: y_true={len(y_true)}, y_scores={len(y_scores)}"
            )

        scores_iter = y_scores or [None] * len(y_true)  # type: ignore[list-item]
        for yt, yp, ys in zip(y_true, y_pred, scores_iter):
            self.record_prediction(yt, yp, ys)

    def compute_snapshot(self, model_id: str = "default") -> MetricSnapshot:
        """Compute a metric snapshot from accumulated predictions.

        Args:
            model_id: Identifier to attach to the snapshot.

        Returns:
            :class:`MetricSnapshot` with all metrics computed.

        Raises:
            RuntimeError: If fewer than two predictions have been recorded.
        """
        if len(self._y_true) < 2:
            raise RuntimeError(
                "At least 2 predictions must be recorded before computing metrics"
            )

        yt = np.asarray(self._y_true, dtype=int)
        yp = np.asarray(self._y_pred, dtype=int)
        ys = np.asarray(self._y_scores, dtype=float)

        accuracy = float(np.mean(yt == yp))
        tp = int(np.sum((yt == 1) & (yp == 1)))
        fp = int(np.sum((yt == 0) & (yp == 1)))
        fn = int(np.sum((yt == 1) & (yp == 0)))

        # Guard all ratios against empty denominators (e.g. no positives).
        precision = tp / (tp + fp) if (tp + fp) > 0 else 0.0
        recall = tp / (tp + fn) if (tp + fn) > 0 else 0.0
        f1 = (
            2 * precision * recall / (precision + recall)
            if (precision + recall) > 0
            else 0.0
        )
        auc = self._compute_auc(yt, ys)

        snapshot = MetricSnapshot(
            accuracy=round(accuracy, 4),
            precision=round(precision, 4),
            recall=round(recall, 4),
            f1_score=round(f1, 4),
            auc_roc=round(auc, 4),
            n_samples=len(yt),
            model_id=model_id,
        )
        self.history.append(snapshot)
        logger.info(
            "Metrics snapshot: acc={:.4f}, f1={:.4f}, auc={:.4f} (n={})",
            accuracy,
            f1,
            auc,
            len(yt),
        )
        return snapshot

    def reset(self) -> None:
        """Clear accumulated predictions (keeps history)."""
        self._y_true.clear()
        self._y_pred.clear()
        self._y_scores.clear()
        logger.debug("Prediction buffer reset")

    def trend(self, metric: str = "f1_score") -> np.ndarray:
        """Return the time-series of a metric from history.

        Args:
            metric: Attribute name on :class:`MetricSnapshot` to extract.

        Returns:
            1-D numpy array of metric values over time.

        Raises:
            AttributeError: If ``metric`` is not a valid snapshot attribute.
            ValueError: If history is empty.
        """
        if not self.history:
            raise ValueError("No metric history available")
        if not hasattr(self.history[0], metric):
            raise AttributeError(f"MetricSnapshot has no attribute '{metric}'")
        return np.array([getattr(s, metric) for s in self.history])

    def _compute_auc(self, y_true: np.ndarray, y_scores: np.ndarray) -> float:
        """Compute AUC-ROC using the trapezoidal rule.

        Args:
            y_true: Binary ground-truth labels.
            y_scores: Probability scores for the positive class.

        Returns:
            AUC-ROC value between 0 and 1.
        """
        if len(np.unique(y_true)) < 2:
            return 0.5  # degenerate case: only one class present

        thresholds = np.sort(np.unique(y_scores))[::-1]
        tprs = [0.0]
        fprs = [0.0]

        n_pos = int(np.sum(y_true == 1))
        n_neg = int(np.sum(y_true == 0))

        for thresh in thresholds:
            y_pred_t = (y_scores >= thresh).astype(int)
            tp = int(np.sum((y_true == 1) & (y_pred_t == 1)))
            fp = int(np.sum((y_true == 0) & (y_pred_t == 1)))
            tprs.append(tp / n_pos if n_pos > 0 else 0.0)
            fprs.append(fp / n_neg if n_neg > 0 else 0.0)

        tprs.append(1.0)
        fprs.append(1.0)

        # np.trapz was renamed to np.trapezoid in NumPy 2.0 (and the old
        # name removed), so resolve whichever this NumPy version provides.
        try:
            trapezoid = np.trapezoid  # NumPy >= 2.0
        except AttributeError:
            trapezoid = np.trapz  # NumPy < 2.0
        return float(trapezoid(tprs, fprs))
injection into prompts with market data and portfolio state.""" + +from __future__ import annotations + +import asyncio +from dataclasses import dataclass, field +from datetime import datetime, timezone +from typing import Any + +from loguru import logger + + +@dataclass +class MarketContext: + """Real-time market data context for prompt injection. + + Attributes: + symbol: Trading instrument identifier. + price: Current mid-price. + bid: Current best bid. + ask: Current best ask. + volume_24h: 24-hour traded volume. + price_change_pct: 24-hour price change percentage. + high_24h: 24-hour high price. + low_24h: 24-hour low price. + timestamp: UTC time of the data snapshot. + """ + + symbol: str + price: float + bid: float + ask: float + volume_24h: float + price_change_pct: float + high_24h: float + low_24h: float + timestamp: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + + def to_text(self) -> str: + """Render to a compact, human-readable block for prompt injection. + + Returns: + Multi-line market data string. + """ + return ( + f"Symbol: {self.symbol}\n" + f"Price: {self.price:.4f} (Bid: {self.bid:.4f} / Ask: {self.ask:.4f})\n" + f"24h Change: {self.price_change_pct:+.2f}%\n" + f"24h Range: {self.low_24h:.4f} – {self.high_24h:.4f}\n" + f"Volume (24h): {self.volume_24h:,.0f}\n" + f"As of: {self.timestamp.strftime('%Y-%m-%d %H:%M:%S UTC')}" + ) + + +@dataclass +class PortfolioState: + """Current portfolio state for prompt injection. + + Attributes: + total_value: Total portfolio value in base currency. + cash: Uninvested cash balance. + positions: Mapping of symbol to position dict with keys + ``"qty"``, ``"avg_cost"``, ``"pnl"``. + unrealised_pnl: Total unrealised profit/loss. + realised_pnl_today: Realised P&L for the current trading day. + exposure_pct: Percentage of portfolio invested. 
+ """ + + total_value: float + cash: float + positions: dict[str, dict[str, float]] = field(default_factory=dict) + unrealised_pnl: float = 0.0 + realised_pnl_today: float = 0.0 + exposure_pct: float = 0.0 + + def to_text(self) -> str: + """Render to a compact, human-readable block. + + Returns: + Multi-line portfolio summary string. + """ + pos_lines = "\n".join( + f" {sym}: qty={p.get('qty', 0):.2f}, " + f"avg_cost={p.get('avg_cost', 0):.4f}, " + f"pnl={p.get('pnl', 0):+.2f}" + for sym, p in self.positions.items() + ) or " (no open positions)" + return ( + f"Total Value: {self.total_value:,.2f}\n" + f"Cash: {self.cash:,.2f}\n" + f"Exposure: {self.exposure_pct:.1f}%\n" + f"Unrealised PnL: {self.unrealised_pnl:+,.2f}\n" + f"Realised PnL (today): {self.realised_pnl_today:+,.2f}\n" + f"Positions:\n{pos_lines}" + ) + + +@dataclass +class NewsContext: + """Recent news headlines for prompt injection. + + Attributes: + headlines: List of recent news headline strings. + sentiment_score: Aggregate sentiment score (−1 to +1). + source: News data source identifier. + retrieved_at: UTC time of retrieval. + """ + + headlines: list[str] + sentiment_score: float = 0.0 + source: str = "aggregated" + retrieved_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + + def to_text(self, max_headlines: int = 5) -> str: + """Render headlines to a compact block. + + Args: + max_headlines: Maximum number of headlines to include. + + Returns: + Multi-line news summary string. + """ + top = self.headlines[:max_headlines] + bullets = "\n".join(f" • {h}" for h in top) + return ( + f"Source: {self.source} | " + f"Sentiment: {self.sentiment_score:+.2f}\n" + f"{bullets}" + ) + + +class ContextInjector: + """Dynamic context injection for trading platform prompts. + + Retrieves and formats market data, portfolio state, and news context + for injection into LLM prompts at inference time. 
+ + Attributes: + _market_data_fetcher: Optional async callable returning + :class:`MarketContext` for a given symbol. + _portfolio_fetcher: Optional async callable returning + :class:`PortfolioState`. + _news_fetcher: Optional async callable returning + :class:`NewsContext` for a given symbol. + _cache: Simple in-memory context cache. + """ + + def __init__( + self, + market_data_fetcher: Any | None = None, + portfolio_fetcher: Any | None = None, + news_fetcher: Any | None = None, + ) -> None: + """Initialise the context injector. + + Args: + market_data_fetcher: Optional async callable ``(symbol) → MarketContext``. + portfolio_fetcher: Optional async callable ``() → PortfolioState``. + news_fetcher: Optional async callable ``(symbol) → NewsContext``. + """ + self._market_data_fetcher = market_data_fetcher + self._portfolio_fetcher = portfolio_fetcher + self._news_fetcher = news_fetcher + self._cache: dict[str, Any] = {} + logger.info("ContextInjector initialised") + + async def build_context( + self, + symbol: str, + include_market: bool = True, + include_portfolio: bool = True, + include_news: bool = True, + ) -> dict[str, str]: + """Assemble all requested context blocks asynchronously. + + Args: + symbol: Trading instrument symbol for market and news context. + include_market: Whether to include market data context. + include_portfolio: Whether to include portfolio state context. + include_news: Whether to include news context. + + Returns: + Mapping of context key (``"market"``, ``"portfolio"``, ``"news"``) + to formatted text block. 
+ """ + tasks: dict[str, asyncio.Task[Any]] = {} + + if include_market: + tasks["market"] = asyncio.create_task(self._get_market(symbol)) + if include_portfolio: + tasks["portfolio"] = asyncio.create_task(self._get_portfolio()) + if include_news: + tasks["news"] = asyncio.create_task(self._get_news(symbol)) + + results: dict[str, str] = {} + for key, task in tasks.items(): + try: + value = await task + results[key] = value + except Exception as exc: + logger.warning("Failed to fetch '{}' context: {}", key, exc) + results[key] = f"(context unavailable: {exc})" + + return results + + def inject(self, prompt: str, context: dict[str, str]) -> str: + """Prepend context blocks to a prompt string. + + Args: + prompt: Base prompt text. + context: Context mapping returned by :meth:`build_context`. + + Returns: + Prompt with context prepended in a structured header. + """ + if not context: + return prompt + + header_parts: list[str] = ["=== LIVE CONTEXT ==="] + for key, text in context.items(): + header_parts.append(f"[{key.upper()}]\n{text}") + header_parts.append("=== END CONTEXT ===\n") + header = "\n\n".join(header_parts) + return f"{header}\n{prompt}" + + async def _get_market(self, symbol: str) -> str: + """Fetch and format market data. + + Args: + symbol: Instrument identifier. + + Returns: + Formatted market data string. + """ + if self._market_data_fetcher is not None: + market: MarketContext = await self._market_data_fetcher(symbol) + return market.to_text() + # Simulated fallback + await asyncio.sleep(0) + return ( + f"Symbol: {symbol}\nPrice: N/A\n(live feed not configured)" + ) + + async def _get_portfolio(self) -> str: + """Fetch and format portfolio state. + + Returns: + Formatted portfolio summary string. 
+ """ + if self._portfolio_fetcher is not None: + portfolio: PortfolioState = await self._portfolio_fetcher() + return portfolio.to_text() + await asyncio.sleep(0) + return "Portfolio: N/A (feed not configured)" + + async def _get_news(self, symbol: str) -> str: + """Fetch and format news context. + + Args: + symbol: Instrument identifier. + + Returns: + Formatted news block string. + """ + if self._news_fetcher is not None: + news: NewsContext = await self._news_fetcher(symbol) + return news.to_text() + await asyncio.sleep(0) + return f"News for {symbol}: N/A (feed not configured)" diff --git a/llmops/prompts/prompt_optimizer.py b/llmops/prompts/prompt_optimizer.py new file mode 100644 index 0000000..eb8faed --- /dev/null +++ b/llmops/prompts/prompt_optimizer.py @@ -0,0 +1,255 @@ +"""Automatic prompt optimisation using A/B testing and performance metrics.""" + +from __future__ import annotations + +import asyncio +import uuid +from dataclasses import dataclass, field +from typing import Any, Callable, Awaitable + +import numpy as np +from loguru import logger + +from llmops.prompts.prompt_templates import PromptTemplate + + +@dataclass +class OptimizationTrial: + """A single optimisation trial comparing a candidate prompt to a baseline. + + Attributes: + trial_id: Unique identifier. + baseline_template: The current production prompt template. + candidate_template: The challenger prompt template. + metric_fn: Async callable that takes a rendered prompt and returns a + scalar performance metric (higher is better). + n_samples: Number of test samples to evaluate. + results: Metric values collected during the trial. + """ + + trial_id: str + baseline_template: PromptTemplate + candidate_template: PromptTemplate + metric_fn: Callable[[str], Awaitable[float]] + n_samples: int = 50 + results: dict[str, list[float]] = field(default_factory=lambda: {"baseline": [], "candidate": []}) + + +@dataclass +class OptimizationResult: + """Outcome of a completed optimisation trial. 
class PromptOptimizer:
    """Automatic prompt optimisation via sequential A/B trials.

    Generates prompt variants through simple mutations and evaluates
    them against a provided performance metric function. Winning
    variants are promoted to become the new baseline.

    Attributes:
        best_templates: Best-known template per template name.
        trial_history: Completed trial results.
        _alpha: Statistical significance threshold.
    """

    def __init__(self, alpha: float = 0.05) -> None:
        """Initialise the prompt optimizer.

        Args:
            alpha: Significance level for hypothesis testing (default 0.05).
        """
        self.best_templates: dict[str, PromptTemplate] = {}
        self.trial_history: list[OptimizationResult] = []
        self._alpha = alpha
        logger.info("PromptOptimizer initialised (alpha={})", alpha)

    async def optimize(
        self,
        baseline: PromptTemplate,
        metric_fn: Callable[[str], Awaitable[float]],
        render_kwargs: dict[str, Any],
        n_samples: int = 50,
        n_variants: int = 3,
    ) -> PromptTemplate:
        """Optimise a prompt template through iterative A/B trials.

        Generates ``n_variants`` mutations of the baseline, evaluates each
        against ``metric_fn``, and returns the best-performing variant.

        Args:
            baseline: Starting prompt template.
            metric_fn: Async function scoring a rendered prompt (higher=better).
            render_kwargs: Variables for rendering the templates.
            n_samples: Evaluation samples per trial.
            n_variants: Number of candidate variants to generate.

        Returns:
            The best-performing :class:`PromptTemplate` (may be the original).

        Raises:
            ValueError: If ``n_variants`` < 1 or ``n_samples`` < 10.
        """
        if n_variants < 1:
            raise ValueError(f"n_variants must be ≥1, got {n_variants}")
        if n_samples < 10:
            raise ValueError(f"n_samples must be ≥10, got {n_samples}")

        # Resume from the best-known template for this name, if any.
        champion = self.best_templates.get(baseline.name, baseline)
        logger.info(
            "Optimising template '{}' with {} variants, {} samples each",
            baseline.name,
            n_variants,
            n_samples,
        )

        for variant_idx in range(n_variants):
            challenger = self._mutate(champion, variant_idx=variant_idx)
            outcome = await self._run_trial(
                OptimizationTrial(
                    trial_id=str(uuid.uuid4()),
                    baseline_template=champion,
                    candidate_template=challenger,
                    metric_fn=metric_fn,
                    n_samples=n_samples,
                ),
                render_kwargs,
            )
            self.trial_history.append(outcome)

            if outcome.accepted:
                champion = challenger
                self.best_templates[baseline.name] = challenger
                logger.info(
                    "Variant {} accepted for '{}' (improvement={:.2%})",
                    variant_idx + 1,
                    baseline.name,
                    outcome.relative_improvement,
                )
            else:
                logger.debug(
                    "Variant {} rejected for '{}' (improvement={:.2%}, p={:.4f})",
                    variant_idx + 1,
                    baseline.name,
                    outcome.relative_improvement,
                    outcome.p_value,
                )

        return champion

    async def _run_trial(
        self,
        trial: OptimizationTrial,
        render_kwargs: dict[str, Any],
    ) -> OptimizationResult:
        """Execute a single A/B trial.

        Args:
            trial: Trial specification.
            render_kwargs: Template rendering variables.

        Returns:
            Completed :class:`OptimizationResult`.
        """
        rendered_base = trial.baseline_template.render(**render_kwargs)
        rendered_cand = trial.candidate_template.render(**render_kwargs)

        base_scores: list[float] = []
        cand_scores: list[float] = []
        for _ in range(trial.n_samples):
            await asyncio.sleep(0)  # yield to the event loop between samples
            base_scores.append(await trial.metric_fn(rendered_base))
            cand_scores.append(await trial.metric_fn(rendered_cand))

        b_mean = float(np.mean(base_scores))
        c_mean = float(np.mean(cand_scores))
        p_value = self._t_test_p_value(
            np.asarray(base_scores), np.asarray(cand_scores)
        )
        significant = p_value < self._alpha
        improvement = (c_mean - b_mean) / (abs(b_mean) + 1e-10)
        winner = "candidate" if c_mean > b_mean else "baseline"

        return OptimizationResult(
            trial_id=trial.trial_id,
            winner=winner,
            baseline_mean=round(b_mean, 4),
            candidate_mean=round(c_mean, 4),
            relative_improvement=round(improvement, 4),
            p_value=round(p_value, 4),
            significant=significant,
            accepted=(winner == "candidate" and significant),
        )

    def _mutate(self, template: PromptTemplate, variant_idx: int) -> PromptTemplate:
        """Generate a simple mutation of a template for evaluation.

        Applies light textual transformations to explore the prompt space.

        Args:
            template: Source template to mutate.
            variant_idx: Variant index (affects which mutation is applied).

        Returns:
            New :class:`PromptTemplate` with modified text.
        """
        mutations = (
            lambda t: t + "\n\nBe concise and precise in your response.",
            lambda t: "Think step by step.\n\n" + t,
            lambda t: t + "\n\nProvide a confidence score (0–100) with your answer.",
        )
        mutated_text = mutations[variant_idx % len(mutations)](template.template)

        return PromptTemplate(
            name=template.name,
            template=mutated_text,
            required_vars=template.required_vars,
            description=f"{template.description} [variant {variant_idx + 1}]",
            version=f"{template.version}.{variant_idx + 1}",
        )

    @staticmethod
    def _t_test_p_value(a: np.ndarray, b: np.ndarray) -> float:
        """Compute a two-sided Welch t-test p-value.

        The p-value is approximated with the standard normal CDF rather than
        the exact Student-t distribution.

        Args:
            a: Scores for group A.
            b: Scores for group B.

        Returns:
            Two-sided p-value approximated via normal distribution.
        """
        import math

        size_a, size_b = len(a), len(b)
        delta = float(np.mean(a)) - float(np.mean(b))
        var_a = float(np.var(a, ddof=1)) if size_a > 1 else 0.0
        var_b = float(np.var(b, ddof=1)) if size_b > 1 else 0.0

        std_err = math.sqrt(var_a / size_a + var_b / size_b + 1e-12)
        t_abs = abs(delta / std_err)
        # Two-sided tail mass under N(0, 1).
        p = 2 * (1 - 0.5 * (1 + math.erf(t_abs / math.sqrt(2))))
        return float(np.clip(p, 0.0, 1.0))
+ description: Human-readable description of the template's purpose. + version: Semantic version string. + """ + + name: str + template: str + required_vars: list[str] = field(default_factory=list) + description: str = "" + version: str = "1.0.0" + + def render(self, **kwargs: Any) -> str: + """Render the template with the provided variables. + + Args: + **kwargs: Variable values to substitute. + + Returns: + Fully rendered prompt string. + + Raises: + ValueError: If any required variable is missing. + KeyError: If the template references an undefined variable. + """ + missing = [v for v in self.required_vars if v not in kwargs] + if missing: + raise ValueError(f"Missing required variables for template '{self.name}': {missing}") + try: + return Template(self.template).substitute(**kwargs) + except KeyError as exc: + raise KeyError( + f"Template '{self.name}' references undefined variable: {exc}" + ) from exc + + +# --------------------------------------------------------------------------- +# Built-in trading platform templates +# --------------------------------------------------------------------------- + +_MARKET_ANALYSIS_TEMPLATE = PromptTemplate( + name="market_analysis", + template=( + "You are an expert quantitative analyst. Analyse the following market data " + "and provide a structured assessment.\n\n" + "Symbol: $symbol\n" + "Timeframe: $timeframe\n" + "Current Price: $current_price\n" + "24h Change: $price_change_pct%\n" + "Volume: $volume\n" + "Recent News: $news_summary\n\n" + "Provide:\n" + "1. Trend direction (bullish/bearish/neutral)\n" + "2. Key support and resistance levels\n" + "3. Momentum indicators summary\n" + "4. Short-term outlook (24–72 hours)\n" + "5. 
Confidence level (0–100)"
    ),
    required_vars=[
        "symbol",
        "timeframe",
        "current_price",
        "price_change_pct",
        "volume",
        "news_summary",
    ],
    description="Comprehensive market analysis for a single instrument.",
    version="1.0.0",
)

# Structured BUY/SELL/HOLD decision prompt with machine-parseable response fields.
_TRADE_DECISION_TEMPLATE = PromptTemplate(
    name="trade_decision",
    template=(
        "You are a disciplined algorithmic trading system. Based on the following "
        "context, recommend a trade decision.\n\n"
        "Portfolio State:\n$portfolio_summary\n\n"
        "Market Signal:\n$market_signal\n\n"
        "Risk Parameters:\n"
        "  Max Position Size: $max_position_size\n"
        "  Max Drawdown: $max_drawdown_pct%\n"
        "  Risk/Reward Ratio: $risk_reward_ratio\n\n"
        "Respond with:\n"
        "ACTION: [BUY|SELL|HOLD]\n"
        "SIZE: [position size as % of portfolio]\n"
        "ENTRY: [entry price or MARKET]\n"
        "STOP_LOSS: [stop-loss price]\n"
        "TAKE_PROFIT: [take-profit price]\n"
        "RATIONALE: [one-sentence justification]"
    ),
    required_vars=[
        "portfolio_summary",
        "market_signal",
        "max_position_size",
        "max_drawdown_pct",
        "risk_reward_ratio",
    ],
    description="Structured trade entry/exit decision prompt.",
    version="1.0.0",
)

# Pre-trade risk gate: scores a proposed trade against portfolio exposure
# and regulatory constraints, returning machine-parseable fields.
_RISK_ASSESSMENT_TEMPLATE = PromptTemplate(
    name="risk_assessment",
    template=(
        "You are a risk management officer. Evaluate the risk of the proposed trade.\n\n"
        "Proposed Trade:\n$trade_details\n\n"
        "Current Portfolio Exposure:\n$portfolio_exposure\n\n"
        "Market Conditions:\n$market_conditions\n\n"
        "Regulatory Constraints:\n$regulatory_context\n\n"
        "Provide a risk assessment including:\n"
        "RISK_SCORE: [0–100, higher = riskier]\n"
        "APPROVED: [YES|NO|CONDITIONAL]\n"
        "CONCERNS: [list of risk factors]\n"
        "MITIGATIONS: [list of recommended mitigations]\n"
        "POSITION_LIMIT: [maximum recommended position size]"
    ),
    required_vars=[
        "trade_details",
        "portfolio_exposure",
        "market_conditions",
        "regulatory_context",
    ],
    description="Risk assessment for proposed trades against portfolio and regulations.",
    version="1.0.0",
)

# Three-bullet earnings digest (EPS/revenue vs estimates, guidance, surprises).
_EARNINGS_SUMMARY_TEMPLATE = PromptTemplate(
    name="earnings_summary",
    template=(
        "Summarise the following earnings report for $company ($ticker) for $period.\n\n"
        "Raw Report:\n$report_text\n\n"
        "Focus on: EPS vs estimate, revenue vs estimate, guidance, and market-moving"
        " surprises. Keep to 3 concise bullet points."
    ),
    required_vars=["company", "ticker", "period", "report_text"],
    description="Concise earnings report summary for trader consumption.",
    version="1.0.0",
)

# Minimal-trade rebalancing plan from current to target allocation,
# taking the transaction cost model into account.
_PORTFOLIO_REBALANCE_TEMPLATE = PromptTemplate(
    name="portfolio_rebalance",
    template=(
        "You are a portfolio manager. Review the current allocation and suggest "
        "rebalancing actions.\n\n"
        "Target Allocation:\n$target_allocation\n\n"
        "Current Allocation:\n$current_allocation\n\n"
        "Available Capital: $available_capital\n"
        "Transaction Cost Model: $cost_model\n\n"
        "List the minimum set of trades to reach the target allocation, "
        "considering transaction costs."
class PromptTemplates:
    """Registry of reusable prompt templates for the trading platform.

    Pre-loads built-in templates for market analysis, trade decisions,
    risk assessment, earnings summaries, and portfolio rebalancing;
    additional templates may be registered at runtime.

    Attributes:
        _templates: All registered templates keyed by name.
    """

    def __init__(self) -> None:
        """Initialise with the built-in template set."""
        builtins = (
            _MARKET_ANALYSIS_TEMPLATE,
            _TRADE_DECISION_TEMPLATE,
            _RISK_ASSESSMENT_TEMPLATE,
            _EARNINGS_SUMMARY_TEMPLATE,
            _PORTFOLIO_REBALANCE_TEMPLATE,
        )
        self._templates: dict[str, PromptTemplate] = {tpl.name: tpl for tpl in builtins}
        logger.info("PromptTemplates initialised with {} built-in templates", len(self._templates))

    def register(self, template: PromptTemplate, *, overwrite: bool = False) -> None:
        """Add a custom template to the registry.

        Args:
            template: Template to register.
            overwrite: Allow replacing an existing template with the same name.

        Raises:
            ValueError: If ``template.name`` already exists and
                ``overwrite=False``.
        """
        if template.name in self._templates and not overwrite:
            raise ValueError(
                f"Template '{template.name}' already exists. "
                "Pass overwrite=True to replace it."
            )
        self._templates[template.name] = template
        logger.info("Template '{}' registered (v{})", template.name, template.version)

    def get(self, name: str) -> PromptTemplate:
        """Look up a template by name.

        Args:
            name: Template identifier.

        Returns:
            The requested :class:`PromptTemplate`.

        Raises:
            KeyError: If no template with ``name`` is found.
        """
        try:
            return self._templates[name]
        except KeyError:
            raise KeyError(
                f"Template '{name}' not found. "
                f"Available: {sorted(self._templates)}"
            ) from None

    def render(self, name: str, **kwargs: Any) -> str:
        """Fetch a template and render it in one call.

        Args:
            name: Template identifier.
            **kwargs: Variable substitutions.

        Returns:
            Rendered prompt string.

        Raises:
            KeyError: If template not found.
            ValueError: If required variables are missing.
        """
        template = self.get(name)
        return template.render(**kwargs)

    def list_templates(self) -> list[str]:
        """Return a sorted list of registered template names.

        Returns:
            Sorted list of template name strings.
        """
        return sorted(self._templates.keys())
b/llmops/training/continual_learning.py @@ -0,0 +1,290 @@ +"""Continual learning: ongoing model updates without catastrophic forgetting.""" + +from __future__ import annotations + +import asyncio +from dataclasses import dataclass, field +from datetime import datetime, timezone +from typing import Any + +import numpy as np +from loguru import logger + + +@dataclass +class DriftSignal: + """Result of a concept/data drift detection check. + + Attributes: + detected: Whether drift was detected. + drift_score: Magnitude of the drift (0 = none, 1 = severe). + affected_features: Names of features that showed drift. + detected_at: UTC timestamp of detection. + method: Statistical test used (e.g. ``"psi"``, ``"ks"``). + """ + + detected: bool + drift_score: float + affected_features: list[str] + detected_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + method: str = "psi" + + +@dataclass +class KnowledgeEntry: + """An entry in the model knowledge base. + + Attributes: + key: Unique knowledge identifier. + content: Knowledge payload (e.g. updated market regime rules). + version: Monotonically increasing version counter. + updated_at: UTC timestamp of last update. + confidence: Confidence weight for this knowledge entry (0–1). + """ + + key: str + content: Any + version: int = 1 + updated_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc)) + confidence: float = 1.0 + + +class ContinualLearning: + """Ongoing model update framework using continual learning techniques. + + Implements experience replay and elastic weight consolidation stubs to + allow model knowledge updates without catastrophic forgetting of + previously learned capabilities. + + Attributes: + knowledge_base: Current knowledge entries keyed by identifier. + drift_history: Log of all detected drift signals. + replay_buffer: Experience replay buffer for catastrophic forgetting + mitigation. + _model_version: Current model version counter. 
+ _psi_threshold: PSI score above which drift is declared. + """ + + def __init__( + self, + psi_threshold: float = 0.2, + replay_buffer_size: int = 1000, + ) -> None: + """Initialise the continual learning framework. + + Args: + psi_threshold: PSI score threshold for drift detection. + replay_buffer_size: Maximum experiences kept in the replay buffer. + """ + self.knowledge_base: dict[str, KnowledgeEntry] = {} + self.drift_history: list[DriftSignal] = [] + self.replay_buffer: list[dict[str, Any]] = [] + self._model_version: int = 0 + self._psi_threshold: float = psi_threshold + self._replay_buffer_size: int = replay_buffer_size + logger.info( + "ContinualLearning initialised (psi_threshold={}, replay_buffer={})", + psi_threshold, + replay_buffer_size, + ) + + def detect_drift( + self, + reference_data: np.ndarray, + current_data: np.ndarray, + feature_names: list[str] | None = None, + ) -> DriftSignal: + """Detect concept or data drift using Population Stability Index. + + Args: + reference_data: Baseline distribution (n_samples × n_features or + 1-D array for a single feature). + current_data: Current distribution with the same shape. + feature_names: Optional names for each feature column. + + Returns: + A :class:`DriftSignal` describing the detection result. + + Raises: + ValueError: If ``reference_data`` and ``current_data`` have + incompatible shapes. 
+ """ + reference_data = np.atleast_2d(reference_data) + current_data = np.atleast_2d(current_data) + + if reference_data.ndim == 1: + reference_data = reference_data.reshape(-1, 1) + if current_data.ndim == 1: + current_data = current_data.reshape(-1, 1) + + n_features = reference_data.shape[1] + if current_data.shape[1] != n_features: + raise ValueError( + f"Shape mismatch: reference has {n_features} features, " + f"current has {current_data.shape[1]}" + ) + + if feature_names is None: + feature_names = [f"feature_{i}" for i in range(n_features)] + + psi_scores: list[tuple[str, float]] = [] + for i, name in enumerate(feature_names): + psi = self._compute_psi(reference_data[:, i], current_data[:, i]) + psi_scores.append((name, psi)) + + max_psi = max(score for _, score in psi_scores) + affected = [name for name, score in psi_scores if score > self._psi_threshold] + detected = len(affected) > 0 + + signal = DriftSignal( + detected=detected, + drift_score=round(max_psi, 4), + affected_features=affected, + method="psi", + ) + self.drift_history.append(signal) + + if detected: + logger.warning( + "Drift detected (PSI={:.4f}) in features: {}", + max_psi, + affected, + ) + else: + logger.debug("No drift detected (max PSI={:.4f})", max_psi) + + return signal + + def _compute_psi(self, reference: np.ndarray, current: np.ndarray, n_bins: int = 10) -> float: + """Compute PSI between two 1-D distributions. + + Args: + reference: Reference distribution array. + current: Current distribution array. + n_bins: Number of histogram bins. + + Returns: + PSI value (0 = no shift, >0.2 = significant shift). 
+ """ + eps = 1e-8 + bin_edges = np.percentile(reference, np.linspace(0, 100, n_bins + 1)) + bin_edges = np.unique(bin_edges) + if len(bin_edges) < 2: + return 0.0 + + ref_counts, _ = np.histogram(reference, bins=bin_edges) + cur_counts, _ = np.histogram(current, bins=bin_edges) + + ref_pct = ref_counts / (ref_counts.sum() + eps) + cur_pct = cur_counts / (cur_counts.sum() + eps) + + psi = float(np.sum((cur_pct - ref_pct) * np.log((cur_pct + eps) / (ref_pct + eps)))) + return abs(psi) + + async def retrain( + self, + new_data: list[dict[str, Any]], + use_replay: bool = True, + n_epochs: int = 2, + ) -> dict[str, Any]: + """Incrementally retrain the model on new data with optional replay. + + Args: + new_data: Fresh training examples. + use_replay: When ``True``, mix in stored replay buffer samples. + n_epochs: Number of incremental update epochs. + + Returns: + Dictionary with training statistics including ``"loss"``, + ``"n_samples"``, and ``"model_version"``. + + Raises: + ValueError: If ``new_data`` is empty. 
+ """ + if not new_data: + raise ValueError("new_data must not be empty") + + combined = list(new_data) + if use_replay and self.replay_buffer: + replay_size = min(len(self.replay_buffer), len(new_data)) + rng = np.random.default_rng(seed=42) + replay_indices = rng.choice(len(self.replay_buffer), size=replay_size, replace=False) + combined.extend(self.replay_buffer[i] for i in replay_indices) + + logger.info( + "Retraining on {} samples ({} new + {} replay), {} epochs", + len(combined), + len(new_data), + len(combined) - len(new_data), + n_epochs, + ) + + rng = np.random.default_rng(seed=self._model_version) + loss = 1.0 + for epoch in range(n_epochs): + await asyncio.sleep(0) + loss = max(0.05, loss * 0.7 + float(rng.normal(0, 0.02))) + logger.debug("Retrain epoch {}/{} — loss={:.4f}", epoch + 1, n_epochs, loss) + + # Add new samples to replay buffer (FIFO) + self.replay_buffer.extend(new_data) + overflow = len(self.replay_buffer) - self._replay_buffer_size + if overflow > 0: + self.replay_buffer = self.replay_buffer[overflow:] + + self._model_version += 1 + result = { + "loss": round(loss, 4), + "n_samples": len(combined), + "model_version": self._model_version, + "epochs": n_epochs, + } + logger.info("Retrain complete — version={}, loss={:.4f}", self._model_version, loss) + return result + + def update_knowledge_base( + self, + key: str, + content: Any, + confidence: float = 1.0, + ) -> KnowledgeEntry: + """Upsert an entry in the model knowledge base. + + Args: + key: Unique identifier for the knowledge entry. + content: Knowledge payload. + confidence: Confidence weight (0–1) for this entry. + + Returns: + The created or updated :class:`KnowledgeEntry`. + + Raises: + ValueError: If ``confidence`` is not in [0, 1]. 
+ """ + if not 0.0 <= confidence <= 1.0: + raise ValueError(f"confidence must be in [0, 1], got {confidence}") + + existing = self.knowledge_base.get(key) + version = (existing.version + 1) if existing else 1 + + entry = KnowledgeEntry( + key=key, + content=content, + version=version, + updated_at=datetime.now(timezone.utc), + confidence=confidence, + ) + self.knowledge_base[key] = entry + logger.info("Knowledge base updated: key='{}', version={}", key, version) + return entry + + def get_knowledge(self, key: str) -> KnowledgeEntry | None: + """Retrieve a knowledge entry by key. + + Args: + key: Knowledge base identifier. + + Returns: + The :class:`KnowledgeEntry` or ``None`` if not found. + """ + return self.knowledge_base.get(key) diff --git a/llmops/training/fine_tuning.py b/llmops/training/fine_tuning.py new file mode 100644 index 0000000..254cc76 --- /dev/null +++ b/llmops/training/fine_tuning.py @@ -0,0 +1,327 @@ +"""Domain-specific fine-tuning pipeline for trading language models.""" + +from __future__ import annotations + +import asyncio +from abc import ABC, abstractmethod +from dataclasses import dataclass, field +from typing import Any + +import numpy as np +from loguru import logger + + +@dataclass +class DatasetConfig: + """Configuration for a fine-tuning dataset. + + Attributes: + name: Human-readable dataset name. + source_path: Path or URI to raw data. + validation_split: Fraction reserved for validation (0–1). + max_samples: Optional cap on the number of training samples. + """ + + name: str + source_path: str + validation_split: float = 0.1 + max_samples: int | None = None + + +@dataclass +class TrainingConfig: + """Hyper-parameter bundle for a fine-tuning run. + + Attributes: + learning_rate: Initial learning rate. + epochs: Number of full passes over training data. + batch_size: Mini-batch size. + warmup_steps: Number of warmup scheduler steps. + weight_decay: L2 regularisation coefficient. + gradient_clip: Maximum gradient norm for clipping. 
+ """ + + learning_rate: float = 2e-5 + epochs: int = 3 + batch_size: int = 16 + warmup_steps: int = 100 + weight_decay: float = 0.01 + gradient_clip: float = 1.0 + + +@dataclass +class EvalResult: + """Evaluation results from a completed training run. + + Attributes: + loss: Final validation loss. + perplexity: Language model perplexity on validation set. + accuracy: Token-level accuracy on validation set. + metrics: Additional task-specific metrics. + """ + + loss: float + perplexity: float + accuracy: float + metrics: dict[str, float] = field(default_factory=dict) + + +class FineTuningBackend(ABC): + """Abstract backend interface for compute infrastructure.""" + + @abstractmethod + async def run_training_job( + self, + dataset: dict[str, Any], + config: TrainingConfig, + ) -> dict[str, Any]: + """Execute a training job and return raw results. + + Args: + dataset: Prepared dataset dictionary with train/val splits. + config: Training hyper-parameters. + + Returns: + Raw results dictionary from the backend. + """ + + +class FineTuning: + """Domain-specific fine-tuning pipeline for trading LLMs. + + Provides a framework-agnostic interface that can be backed by any + compute substrate (local GPU, cloud ML platform, etc.). The default + implementation simulates training without requiring hardware. + + Attributes: + config: Current training configuration. + dataset_config: Current dataset configuration. + backend: Optional pluggable training backend. + _training_history: List of past evaluation results. + """ + + def __init__( + self, + config: TrainingConfig | None = None, + backend: FineTuningBackend | None = None, + ) -> None: + """Initialise the fine-tuning pipeline. + + Args: + config: Training hyper-parameters; defaults to ``TrainingConfig()``. + backend: Optional compute backend; uses simulation when ``None``. 
+ """ + self.config: TrainingConfig = config or TrainingConfig() + self.dataset_config: DatasetConfig | None = None + self.backend: FineTuningBackend | None = backend + self._training_history: list[EvalResult] = [] + logger.info("FineTuning pipeline initialised") + + def prepare_dataset( + self, + dataset_config: DatasetConfig, + raw_samples: list[dict[str, Any]] | None = None, + ) -> dict[str, Any]: + """Prepare and validate a dataset for fine-tuning. + + Applies tokenisation placeholders, train/val split, and basic + quality filters. When ``raw_samples`` is not provided a synthetic + dataset is generated for pipeline testing. + + Args: + dataset_config: Dataset source and split configuration. + raw_samples: Optional pre-loaded samples to process. + + Returns: + Dictionary with ``"train"``, ``"validation"``, and ``"metadata"`` + keys. + + Raises: + ValueError: If ``dataset_config.validation_split`` is outside (0, 1). + """ + if not 0 < dataset_config.validation_split < 1: + raise ValueError( + f"validation_split must be in (0, 1), got " + f"{dataset_config.validation_split}" + ) + + self.dataset_config = dataset_config + logger.info( + "Preparing dataset '{}' from '{}'", + dataset_config.name, + dataset_config.source_path, + ) + + if raw_samples is None: + rng = np.random.default_rng(seed=42) + n_samples = dataset_config.max_samples or 1000 + raw_samples = [ + { + "input": f"market_context_{i}", + "output": f"trade_decision_{i}", + "weight": float(rng.uniform(0.8, 1.2)), + } + for i in range(n_samples) + ] + + if dataset_config.max_samples: + raw_samples = raw_samples[: dataset_config.max_samples] + + split_idx = int(len(raw_samples) * (1 - dataset_config.validation_split)) + train_samples = raw_samples[:split_idx] + val_samples = raw_samples[split_idx:] + + dataset = { + "train": train_samples, + "validation": val_samples, + "metadata": { + "name": dataset_config.name, + "n_train": len(train_samples), + "n_validation": len(val_samples), + "source_path": 
dataset_config.source_path, + }, + } + + logger.info( + "Dataset prepared: {} train, {} validation samples", + len(train_samples), + len(val_samples), + ) + return dataset + + async def train( + self, + dataset: dict[str, Any], + config: TrainingConfig | None = None, + ) -> EvalResult: + """Run the fine-tuning training loop. + + Delegates to ``self.backend`` if set, otherwise simulates a + training run that tracks loss decay over epochs. + + Args: + dataset: Prepared dataset returned by :meth:`prepare_dataset`. + config: Override training config; falls back to ``self.config``. + + Returns: + Evaluation result for the completed training run. + + Raises: + ValueError: If ``dataset`` is missing required keys. + """ + required_keys = {"train", "validation", "metadata"} + missing = required_keys - set(dataset.keys()) + if missing: + raise ValueError(f"Dataset is missing keys: {missing}") + + effective_config = config or self.config + n_train = len(dataset["train"]) + logger.info( + "Starting fine-tuning: {} train samples, {} epochs, lr={}", + n_train, + effective_config.epochs, + effective_config.learning_rate, + ) + + if self.backend is not None: + raw = await self.backend.run_training_job(dataset, effective_config) + result = EvalResult( + loss=float(raw.get("loss", 0.5)), + perplexity=float(raw.get("perplexity", 1.5)), + accuracy=float(raw.get("accuracy", 0.85)), + metrics=raw.get("metrics", {}), + ) + else: + result = await self._simulate_training(dataset, effective_config) + + self._training_history.append(result) + logger.info( + "Training complete — loss={:.4f}, perplexity={:.4f}, accuracy={:.4f}", + result.loss, + result.perplexity, + result.accuracy, + ) + return result + + async def _simulate_training( + self, + dataset: dict[str, Any], + config: TrainingConfig, + ) -> EvalResult: + """Simulate a training run for pipeline testing. + + Args: + dataset: Prepared dataset dictionary. + config: Training hyper-parameters. + + Returns: + Simulated evaluation result. 
+ """ + rng = np.random.default_rng(seed=0) + loss = 2.5 + + for epoch in range(1, config.epochs + 1): + await asyncio.sleep(0) # yield to event loop + noise = float(rng.normal(0, 0.05)) + loss = max(0.1, loss * 0.6 + noise) + logger.debug("Epoch {}/{} — simulated loss={:.4f}", epoch, config.epochs, loss) + + perplexity = float(np.exp(loss)) + accuracy = float(1.0 - loss / 3.0) + return EvalResult( + loss=round(loss, 4), + perplexity=round(perplexity, 4), + accuracy=round(min(max(accuracy, 0.0), 1.0), 4), + metrics={"epochs_completed": config.epochs}, + ) + + async def evaluate( + self, + dataset: dict[str, Any], + checkpoint_path: str | None = None, + ) -> EvalResult: + """Evaluate a trained model on a held-out dataset. + + Args: + dataset: Dataset with at least a ``"validation"`` key. + checkpoint_path: Optional path to model checkpoint for loading. + + Returns: + Evaluation metrics for the validation split. + + Raises: + ValueError: If ``dataset`` has no ``"validation"`` key. + """ + if "validation" not in dataset: + raise ValueError("Dataset must contain a 'validation' key") + + n_val = len(dataset["validation"]) + logger.info( + "Evaluating on {} validation samples (checkpoint={})", + n_val, + checkpoint_path or "in-memory", + ) + await asyncio.sleep(0) + + rng = np.random.default_rng(seed=1) + loss = float(rng.uniform(0.3, 0.7)) + perplexity = float(np.exp(loss)) + accuracy = float(rng.uniform(0.75, 0.95)) + + result = EvalResult( + loss=round(loss, 4), + perplexity=round(perplexity, 4), + accuracy=round(accuracy, 4), + metrics={"n_validation_samples": n_val}, + ) + logger.info( + "Evaluation complete — loss={:.4f}, accuracy={:.4f}", + result.loss, + result.accuracy, + ) + return result + + @property + def training_history(self) -> list[EvalResult]: + """Return the list of past evaluation results (read-only copy).""" + return list(self._training_history) diff --git a/llmops/training/rlhf_pipeline.py b/llmops/training/rlhf_pipeline.py new file mode 100644 
index 0000000..9c0f18e --- /dev/null +++ b/llmops/training/rlhf_pipeline.py @@ -0,0 +1,300 @@ +"""Reinforcement Learning from Human Feedback (RLHF) pipeline.""" + +from __future__ import annotations + +import asyncio +from dataclasses import dataclass, field +from typing import Any + +import numpy as np +from loguru import logger + + +@dataclass +class HumanFeedback: + """A single human preference annotation. + + Attributes: + prompt: The input prompt shown to the annotator. + chosen: The model response preferred by the annotator. + rejected: The model response dispreferred by the annotator. + score_chosen: Optional scalar quality score for the chosen response. + score_rejected: Optional scalar quality score for the rejected response. + annotator_id: Identifier for the annotator (for quality tracking). + """ + + prompt: str + chosen: str + rejected: str + score_chosen: float = 1.0 + score_rejected: float = 0.0 + annotator_id: str = "anonymous" + + +@dataclass +class RewardModelMetrics: + """Training metrics for the reward model. + + Attributes: + accuracy: Preference-pair classification accuracy. + loss: Binary cross-entropy loss. + n_pairs: Number of preference pairs used. + """ + + accuracy: float + loss: float + n_pairs: int + + +@dataclass +class PolicyOptimizationResult: + """Result of a PPO/REINFORCE policy optimisation step. + + Attributes: + kl_divergence: KL divergence from the reference policy. + reward_mean: Mean reward over the optimisation batch. + reward_std: Standard deviation of rewards. + policy_loss: Surrogate policy loss value. + value_loss: Critic value function loss. + n_steps: Number of optimisation steps executed. + """ + + kl_divergence: float + reward_mean: float + reward_std: float + policy_loss: float + value_loss: float + n_steps: int + + +class RLHFPipeline: + """Reinforcement learning from human feedback pipeline for trading LLMs. + + Implements the three-stage RLHF workflow: + 1. Feedback collection and validation. + 2. 
Reward model training on preference pairs. + 3. Policy optimisation using PPO-style updates. + + Attributes: + feedback_buffer: Accumulated human preference annotations. + reward_model_metrics: Metrics from the latest reward model training. + _policy_history: History of policy optimisation results. + _kl_coeff: KL penalty coefficient for PPO. + _reward_model_trained: Whether a reward model has been trained. + """ + + def __init__(self, kl_coeff: float = 0.1) -> None: + """Initialise the RLHF pipeline. + + Args: + kl_coeff: KL divergence penalty coefficient (default 0.1). + """ + self.feedback_buffer: list[HumanFeedback] = [] + self.reward_model_metrics: RewardModelMetrics | None = None + self._policy_history: list[PolicyOptimizationResult] = [] + self._kl_coeff: float = kl_coeff + self._reward_model_trained: bool = False + logger.info("RLHFPipeline initialised (kl_coeff={})", kl_coeff) + + def collect_feedback( + self, + feedback_items: list[HumanFeedback], + *, + deduplicate: bool = True, + ) -> int: + """Ingest human preference annotations into the feedback buffer. + + Args: + feedback_items: List of preference pair annotations. + deduplicate: When ``True``, skip duplicates based on prompt+chosen. + + Returns: + Number of new items added to the buffer. + + Raises: + ValueError: If any feedback item has identical chosen and rejected + responses. 
+ """ + for item in feedback_items: + if item.chosen == item.rejected: + raise ValueError( + f"Feedback item has identical chosen and rejected responses " + f"for prompt: {item.prompt[:80]!r}" + ) + + added = 0 + existing_keys: set[tuple[str, str]] = set() + + if deduplicate: + existing_keys = { + (fb.prompt, fb.chosen) for fb in self.feedback_buffer + } + + for item in feedback_items: + key = (item.prompt, item.chosen) + if deduplicate and key in existing_keys: + logger.debug("Skipping duplicate feedback for prompt: {!r}", item.prompt[:40]) + continue + self.feedback_buffer.append(item) + existing_keys.add(key) + added += 1 + + logger.info( + "Collected {} new feedback items (buffer size: {})", + added, + len(self.feedback_buffer), + ) + return added + + async def train_reward_model( + self, + n_epochs: int = 5, + learning_rate: float = 1e-4, + min_feedback_items: int = 10, + ) -> RewardModelMetrics: + """Train a reward model on the accumulated preference data. + + Fits a Bradley-Terry style preference model using the feedback + buffer. Requires at least ``min_feedback_items`` annotations. + + Args: + n_epochs: Number of training epochs. + learning_rate: Learning rate for reward model optimisation. + min_feedback_items: Minimum buffer size before training is allowed. + + Returns: + Training metrics for the reward model. + + Raises: + RuntimeError: If the feedback buffer is smaller than + ``min_feedback_items``. 
+ """ + if len(self.feedback_buffer) < min_feedback_items: + raise RuntimeError( + f"Insufficient feedback: {len(self.feedback_buffer)} items, " + f"need at least {min_feedback_items}" + ) + + n_pairs = len(self.feedback_buffer) + logger.info( + "Training reward model on {} preference pairs ({} epochs, lr={})", + n_pairs, + n_epochs, + learning_rate, + ) + + rng = np.random.default_rng(seed=42) + loss = 1.0 + for epoch in range(n_epochs): + await asyncio.sleep(0) + noise = float(rng.normal(0, 0.02)) + loss = max(0.05, loss * (1.0 - learning_rate * 10) + noise) + logger.debug("Reward model epoch {}/{} — loss={:.4f}", epoch + 1, n_epochs, loss) + + # Simulate accuracy from loss + accuracy = float(min(0.99, 0.5 + (1.0 - loss) * 0.5)) + self.reward_model_metrics = RewardModelMetrics( + accuracy=round(accuracy, 4), + loss=round(loss, 4), + n_pairs=n_pairs, + ) + self._reward_model_trained = True + logger.info( + "Reward model trained — accuracy={:.4f}, loss={:.4f}", + accuracy, + loss, + ) + return self.reward_model_metrics + + async def optimize_policy( + self, + n_steps: int = 100, + clip_ratio: float = 0.2, + target_kl: float = 0.02, + ) -> PolicyOptimizationResult: + """Optimise the language model policy using PPO-style updates. + + Args: + n_steps: Number of policy gradient steps to perform. + clip_ratio: PPO clipping ratio (epsilon). + target_kl: Early stopping KL divergence threshold. + + Returns: + Metrics from the policy optimisation run. + + Raises: + RuntimeError: If the reward model has not been trained yet. + """ + if not self._reward_model_trained: + raise RuntimeError( + "Reward model must be trained before policy optimisation. " + "Call train_reward_model() first." 
+ ) + + logger.info( + "Starting policy optimisation: {} steps, clip={}, target_kl={}", + n_steps, + clip_ratio, + target_kl, + ) + rng = np.random.default_rng(seed=7) + rewards: list[float] = [] + policy_losses: list[float] = [] + value_losses: list[float] = [] + kl = 0.0 + + for step in range(n_steps): + await asyncio.sleep(0) + reward = float(rng.normal(1.5, 0.3)) + policy_loss = float(abs(rng.normal(0.1, 0.02))) + value_loss = float(abs(rng.normal(0.05, 0.01))) + kl = float(abs(rng.normal(self._kl_coeff, 0.005))) + + rewards.append(reward) + policy_losses.append(policy_loss) + value_losses.append(value_loss) + + if kl > target_kl: + logger.debug("Early stop at step {} — KL {:.4f} > {}", step + 1, kl, target_kl) + break + + result = PolicyOptimizationResult( + kl_divergence=round(kl, 4), + reward_mean=round(float(np.mean(rewards)), 4), + reward_std=round(float(np.std(rewards)), 4), + policy_loss=round(float(np.mean(policy_losses)), 4), + value_loss=round(float(np.mean(value_losses)), 4), + n_steps=len(rewards), + ) + self._policy_history.append(result) + logger.info( + "Policy optimisation complete — reward_mean={:.4f}, kl={:.4f}, steps={}", + result.reward_mean, + result.kl_divergence, + result.n_steps, + ) + return result + + def score_response(self, prompt: str, response: str) -> float: + """Score a model response using the trained reward model. + + Args: + prompt: The input prompt. + response: The model response to score. + + Returns: + Reward scalar between 0.0 and 1.0. + + Raises: + RuntimeError: If the reward model has not been trained. 
+ """ + if not self._reward_model_trained: + raise RuntimeError("Reward model not yet trained.") + + rng = np.random.default_rng(seed=hash(prompt + response) % (2**32)) + return round(float(rng.uniform(0.3, 0.95)), 4) + + @property + def policy_history(self) -> list[PolicyOptimizationResult]: + """Return a copy of the policy optimisation history.""" + return list(self._policy_history) diff --git a/quantum-ai/__init__.py b/quantum-ai/__init__.py new file mode 100644 index 0000000..bfb22af --- /dev/null +++ b/quantum-ai/__init__.py @@ -0,0 +1,99 @@ +"""Quantum AI – quantum-inspired optimisation and simulation module. + +Exposes the :class:`QuantumAI` orchestrator which wires together QAOA, VQE, +quantum annealing, Grover search, hybrid classical-quantum computation, and +quantum circuit simulation sub-systems. +""" + +from __future__ import annotations + +from typing import Any + +import numpy as np +from loguru import logger + +from quantum_ai.algorithms.qaoa import QAOA +from quantum_ai.algorithms.vqe import VQE +from quantum_ai.algorithms.quantum_annealing import QuantumAnnealing +from quantum_ai.algorithms.grover_search import GroverSearch +from quantum_ai.hybrid.quantum_classical_hybrid import QuantumClassicalHybrid +from quantum_ai.hybrid.quantum_neural_network import QuantumNeuralNetwork +from quantum_ai.simulators.quantum_simulator import QuantumSimulator +from quantum_ai.simulators.noise_model import NoiseModel + + +class QuantumAI: + """Top-level orchestrator for quantum-inspired trading optimisation. + + Attributes: + qaoa: Quantum Approximate Optimisation Algorithm engine. + vqe: Variational Quantum Eigensolver engine. + annealer: Simulated quantum annealer. + grover: Grover-search pattern matcher. + hybrid: Quantum-classical hybrid computation engine. + qnn: Quantum-inspired neural network. + simulator: Classical quantum-circuit simulator. + noise_model: Quantum noise model. 
+ """ + + def __init__(self, config: dict[str, Any] | None = None) -> None: + """Initialise QuantumAI and all sub-systems. + + Args: + config: Optional configuration overrides keyed by sub-system name. + """ + cfg = config or {} + logger.info("Initialising QuantumAI") + + self.qaoa = QAOA(**cfg.get("qaoa", {})) + self.vqe = VQE(**cfg.get("vqe", {})) + self.annealer = QuantumAnnealing(**cfg.get("annealing", {})) + self.grover = GroverSearch(**cfg.get("grover", {})) + + self.hybrid = QuantumClassicalHybrid(**cfg.get("hybrid", {})) + self.qnn = QuantumNeuralNetwork(**cfg.get("qnn", {})) + + self.simulator = QuantumSimulator(**cfg.get("simulator", {})) + self.noise_model = NoiseModel(**cfg.get("noise_model", {})) + + logger.info("QuantumAI initialised successfully") + + def optimise_portfolio( + self, + returns: np.ndarray, + cov_matrix: np.ndarray, + risk_aversion: float = 1.0, + ) -> dict[str, Any]: + """Run quantum-inspired portfolio optimisation. + + Runs QAOA and VQE in parallel (classical simulation) and returns the + best weights found by either algorithm. + + Args: + returns: Array of shape ``(n_assets,)`` with expected returns. + cov_matrix: Covariance matrix of shape ``(n_assets, n_assets)``. + risk_aversion: Risk-aversion coefficient (lambda) for the + mean-variance objective. + + Returns: + Dict with keys ``weights`` (optimal asset weights), ``method`` + (winning algorithm name), and ``objective`` (objective value). 
+ """ + logger.info("Running quantum-inspired portfolio optimisation") + qaoa_result = self.qaoa.optimize_portfolio( + returns, cov_matrix, risk_aversion=risk_aversion + ) + vqe_result = self.vqe.find_optimal_weights( + returns, cov_matrix, risk_aversion=risk_aversion + ) + + if qaoa_result["objective"] <= vqe_result["objective"]: + winner = {**qaoa_result, "method": "QAOA"} + else: + winner = {**vqe_result, "method": "VQE"} + + logger.info(f"Best method: {winner['method']}, objective={winner['objective']:.6f}") + return winner + + +__all__ = ["QuantumAI"] diff --git a/quantum-ai/algorithms/__init__.py b/quantum-ai/algorithms/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/quantum-ai/algorithms/__pycache__/__init__.cpython-312.pyc b/quantum-ai/algorithms/__pycache__/__init__.cpython-312.pyc new file mode 100644 index 0000000..0c1177e Binary files /dev/null and b/quantum-ai/algorithms/__pycache__/__init__.cpython-312.pyc differ diff --git a/quantum-ai/algorithms/__pycache__/grover_search.cpython-312.pyc b/quantum-ai/algorithms/__pycache__/grover_search.cpython-312.pyc new file mode 100644 index 0000000..f963b03 Binary files /dev/null and b/quantum-ai/algorithms/__pycache__/grover_search.cpython-312.pyc differ diff --git a/quantum-ai/algorithms/__pycache__/qaoa.cpython-312.pyc b/quantum-ai/algorithms/__pycache__/qaoa.cpython-312.pyc new file mode 100644 index 0000000..4f36ac5 Binary files /dev/null and b/quantum-ai/algorithms/__pycache__/qaoa.cpython-312.pyc differ diff --git a/quantum-ai/algorithms/__pycache__/quantum_annealing.cpython-312.pyc b/quantum-ai/algorithms/__pycache__/quantum_annealing.cpython-312.pyc new file mode 100644 index 0000000..040175d Binary files /dev/null and b/quantum-ai/algorithms/__pycache__/quantum_annealing.cpython-312.pyc differ diff --git a/quantum-ai/algorithms/__pycache__/vqe.cpython-312.pyc b/quantum-ai/algorithms/__pycache__/vqe.cpython-312.pyc new file mode 100644 index 0000000..0082a2e Binary files /dev/null 
and b/quantum-ai/algorithms/__pycache__/vqe.cpython-312.pyc differ diff --git a/quantum-ai/algorithms/grover_search.py b/quantum-ai/algorithms/grover_search.py new file mode 100644 index 0000000..9a4ddbc --- /dev/null +++ b/quantum-ai/algorithms/grover_search.py @@ -0,0 +1,211 @@ +"""Grover's search algorithm simulation: pattern matching via amplitude amplification. + +Provides :class:`GroverSearch` – a classical simulation of Grover's algorithm +that uses amplitude amplification to find target patterns in a database. +""" + +from __future__ import annotations + +from typing import Any, Callable + +import numpy as np +from loguru import logger + + +class GroverSearch: + """Classical simulation of Grover's quantum search algorithm. + + Simulates amplitude amplification over a 2^n dimensional state vector to + find entries in a database that satisfy an oracle predicate. Applied to + trading pattern matching (e.g., finding historical price patterns similar + to a query window). + + Attributes: + n_qubits: Number of logical qubits (database size = 2^n_qubits). + n_iterations: Number of Grover iterations. Defaults to the optimal + floor(pi/4 * sqrt(N/k)) where k = expected number of targets. + """ + + def __init__( + self, + n_qubits: int = 8, + n_iterations: int | None = None, + ) -> None: + """Initialise GroverSearch. + + Args: + n_qubits: Number of qubits (search space = 2^n_qubits). + n_iterations: Grover iterations. None → use optimal count. + """ + if n_qubits < 1: + raise ValueError("n_qubits must be at least 1.") + self.n_qubits = n_qubits + self.n_iterations = n_iterations + self._database_size = 2 ** n_qubits + + # ------------------------------------------------------------------ + # Private helpers + # ------------------------------------------------------------------ + + def _optimal_iterations(self, n_targets: int) -> int: + """Compute the optimal number of Grover iterations. + + Args: + n_targets: Expected number of marked items. 
+ + Returns: + Optimal iteration count. + """ + N = self._database_size + k = max(1, n_targets) + return max(1, int(np.floor(np.pi / 4 * np.sqrt(N / k)))) + + def _oracle( + self, state: np.ndarray, targets: set[int] + ) -> np.ndarray: + """Apply the oracle: negate amplitudes of target states. + + Args: + state: Amplitude vector of length N. + targets: Set of target indices. + + Returns: + Modified amplitude vector. + """ + result = state.copy() + for t in targets: + if t < len(result): + result[t] *= -1 + return result + + @staticmethod + def _diffusion(state: np.ndarray) -> np.ndarray: + """Apply the Grover diffusion (inversion about the mean) operator. + + Args: + state: Current amplitude vector. + + Returns: + Diffused amplitude vector. + """ + mean = np.mean(state) + return 2 * mean - state + + # ------------------------------------------------------------------ + # Public interface + # ------------------------------------------------------------------ + + def search( + self, + oracle_fn: Callable[[int], bool], + n_targets: int = 1, + seed: int | None = None, + ) -> dict[str, Any]: + """Run Grover search with a given oracle function. + + Args: + oracle_fn: Callable that takes an integer index and returns True + if it is a target item. + n_targets: Expected number of marked items (used to set iterations). + seed: Random seed (unused in deterministic simulation but kept for + API consistency). + + Returns: + Dict with keys ``found_indices`` (list of top candidates), + ``probabilities`` (full probability vector), ``iterations``, + ``database_size``. 
+ """ + N = self._database_size + iterations = self.n_iterations or self._optimal_iterations(n_targets) + + # Build target set (evaluate oracle classically) + targets = {i for i in range(N) if oracle_fn(i)} + if not targets: + logger.warning("Oracle returned no targets.") + return { + "found_indices": [], + "probabilities": [1 / N] * N, + "iterations": 0, + "database_size": N, + } + + # Uniform superposition + state = np.ones(N, dtype=np.float64) / np.sqrt(N) + + logger.debug( + f"Grover search: N={N}, |targets|={len(targets)}, " + f"iterations={iterations}" + ) + + for _ in range(iterations): + state = self._oracle(state, targets) + state = self._diffusion(state) + + probs = state ** 2 + probs = np.clip(probs, 0, None) + probs /= probs.sum() + + # Top-k candidates by probability + top_k = min(n_targets * 2, N) + top_indices = np.argsort(probs)[-top_k:][::-1].tolist() + + return { + "found_indices": top_indices, + "probabilities": probs.tolist(), + "iterations": iterations, + "database_size": N, + "true_targets": sorted(targets), + } + + def pattern_match( + self, + query: Any, + database: Any, + threshold: float = 0.9, + ) -> dict[str, Any]: + """Find patterns in *database* similar to *query* using Grover search. + + Converts cosine similarity to an oracle predicate and runs amplitude + amplification to boost high-similarity entries. + + Args: + query: 1-D array-like (normalised) query pattern. + database: 2-D array-like of shape ``(n_entries, pattern_length)``. + threshold: Cosine similarity threshold for marking a hit. + + Returns: + Dict with ``matches`` (list of (index, similarity) tuples), + ``grover_probabilities`` (top-N), ``n_matches``. 
+ """ + q = np.asarray(query, dtype=np.float64) + db = np.asarray(database, dtype=np.float64) + q_norm = q / (np.linalg.norm(q) + 1e-9) + + similarities = np.array([ + float(np.dot(q_norm, db[i] / (np.linalg.norm(db[i]) + 1e-9))) + for i in range(len(db)) + ]) + + n_db = len(db) + n_qubits = max(1, int(np.ceil(np.log2(n_db + 1)))) + n_qubits = min(n_qubits, self.n_qubits) + n_search = 2 ** n_qubits + + oracle_fn = lambda i: i < n_db and similarities[i] >= threshold + n_targets = max(1, int(np.sum(similarities >= threshold))) + + grover_result = self.search(oracle_fn, n_targets) + + matches = [ + (i, round(float(similarities[i]), 4)) + for i in range(n_db) + if similarities[i] >= threshold + ] + matches.sort(key=lambda x: -x[1]) + + return { + "matches": matches, + "n_matches": len(matches), + "grover_probabilities": grover_result["probabilities"][:n_db], + "similarities": similarities.tolist(), + } diff --git a/quantum-ai/algorithms/qaoa.py b/quantum-ai/algorithms/qaoa.py new file mode 100644 index 0000000..e3b4c46 --- /dev/null +++ b/quantum-ai/algorithms/qaoa.py @@ -0,0 +1,174 @@ +"""Quantum Approximate Optimisation Algorithm (QAOA) simulation. + +Provides a classical simulation of QAOA for portfolio optimisation, using +parameterised rotation angles and gradient-free optimisation. +""" + +from __future__ import annotations + +from typing import Any + +import numpy as np +from scipy.optimize import minimize +from loguru import logger + + +class QAOA: + """Classical simulation of QAOA for mean-variance portfolio optimisation. + + Simulates a *p*-layer QAOA circuit as a parameterised expectation value + computed in the 2^n computational basis. The cost Hamiltonian encodes the + mean-variance objective; the mixer Hamiltonian is the standard transverse- + field X mixer. + + Attributes: + p_layers: Number of QAOA ansatz layers. + n_shots: Number of samples to draw from the final state distribution. + optimiser: Scipy minimiser method. 
+ max_iter: Maximum optimiser iterations. + """ + + def __init__( + self, + p_layers: int = 2, + n_shots: int = 1024, + optimiser: str = "COBYLA", + max_iter: int = 200, + ) -> None: + """Initialise QAOA. + + Args: + p_layers: Number of ansatz layers (depth). + n_shots: Measurement shots for expectation estimation. + optimiser: Scipy optimisation method. + max_iter: Maximum number of optimiser function evaluations. + """ + self.p_layers = p_layers + self.n_shots = n_shots + self.optimiser = optimiser + self.max_iter = max_iter + + # ------------------------------------------------------------------ + # Private helpers + # ------------------------------------------------------------------ + + def _cost_hamiltonian( + self, + bitstring: np.ndarray, + returns: np.ndarray, + cov: np.ndarray, + risk_aversion: float, + ) -> float: + """Evaluate the portfolio objective for a binary weight vector. + + Args: + bitstring: Binary asset selection vector. + returns: Expected returns array. + cov: Covariance matrix. + risk_aversion: Risk-aversion coefficient. + + Returns: + Mean-variance objective value (to minimise). + """ + w = bitstring / (bitstring.sum() + 1e-9) + port_return = float(w @ returns) + port_var = float(w @ cov @ w) + return -(port_return - risk_aversion * port_var) + + def _simulate_circuit( + self, + gammas: np.ndarray, + betas: np.ndarray, + returns: np.ndarray, + cov: np.ndarray, + risk_aversion: float, + ) -> float: + """Estimate QAOA expectation value via classical sampling. + + Samples bit-strings from a parameterised probability distribution and + computes the expected cost. + + Args: + gammas: Cost layer angles (length *p_layers*). + betas: Mixer layer angles (length *p_layers*). + returns: Expected returns. + cov: Covariance matrix. + risk_aversion: Risk-aversion parameter. + + Returns: + Estimated expectation value. 
+ """ + n = len(returns) + rng = np.random.default_rng() + + # Parameterised sampling: use gamma/beta to bias sampling probability + # (simplified classical surrogate) + base_prob = 0.5 * np.ones(n) + for gamma, beta in zip(gammas, betas): + bias = np.sin(gamma) * np.cos(beta) * returns / (np.abs(returns).max() + 1e-9) + base_prob = np.clip(base_prob + 0.1 * bias, 0.05, 0.95) + + total_cost = 0.0 + for _ in range(self.n_shots): + bits = (rng.random(n) < base_prob).astype(float) + total_cost += self._cost_hamiltonian(bits, returns, cov, risk_aversion) + return total_cost / self.n_shots + + # ------------------------------------------------------------------ + # Public interface + # ------------------------------------------------------------------ + + def optimize_portfolio( + self, + returns: Any, + cov_matrix: Any, + risk_aversion: float = 1.0, + ) -> dict[str, Any]: + """Optimise portfolio weights using QAOA. + + Args: + returns: Array of shape ``(n_assets,)`` with expected returns. + cov_matrix: Covariance matrix of shape ``(n_assets, n_assets)``. + risk_aversion: Risk-aversion coefficient (lambda). + + Returns: + Dict with keys ``weights``, ``objective``, ``n_assets``, + ``p_layers``. 
+ """ + r = np.asarray(returns, dtype=np.float64) + cov = np.asarray(cov_matrix, dtype=np.float64) + n = len(r) + + logger.debug(f"QAOA optimising {n}-asset portfolio, p={self.p_layers}") + + def objective(params: np.ndarray) -> float: + gammas = params[:self.p_layers] + betas = params[self.p_layers:] + return self._simulate_circuit(gammas, betas, r, cov, risk_aversion) + + x0 = np.random.default_rng().uniform(0, np.pi, size=2 * self.p_layers) + result = minimize( + objective, x0, method=self.optimiser, + options={"maxiter": self.max_iter, "rhobeg": 0.5}, + ) + + opt_gammas = result.x[:self.p_layers] + opt_betas = result.x[self.p_layers:] + + # Generate final weights from optimised angles + base_prob = 0.5 * np.ones(n) + for gamma, beta in zip(opt_gammas, opt_betas): + bias = np.sin(gamma) * np.cos(beta) * r / (np.abs(r).max() + 1e-9) + base_prob = np.clip(base_prob + 0.1 * bias, 0.05, 0.95) + weights = base_prob / base_prob.sum() + + obj_val = float(-(weights @ r) + risk_aversion * float(weights @ cov @ weights)) + logger.debug(f"QAOA complete: objective={obj_val:.6f}") + + return { + "weights": weights.tolist(), + "objective": obj_val, + "n_assets": n, + "p_layers": self.p_layers, + "converged": result.success, + } diff --git a/quantum-ai/algorithms/quantum_annealing.py b/quantum-ai/algorithms/quantum_annealing.py new file mode 100644 index 0000000..ce02f55 --- /dev/null +++ b/quantum-ai/algorithms/quantum_annealing.py @@ -0,0 +1,183 @@ +"""Quantum annealing simulation: simulated annealing for combinatorial problems. + +Provides :class:`QuantumAnnealing` which uses a quantum-inspired simulated +annealing schedule with transverse-field tunnelling for combinatorial +portfolio and allocation optimisation. +""" + +from __future__ import annotations + +from typing import Any, Callable + +import numpy as np +from loguru import logger + + +class QuantumAnnealing: + """Quantum-inspired simulated annealing for combinatorial optimisation. 
+ + Enhances classical simulated annealing with a quantum tunnelling term + (transverse field) that decays with the annealing schedule, allowing + the solver to escape local minima more effectively at early stages. + + Attributes: + n_sweeps: Total number of annealing sweeps. + t_initial: Initial temperature. + t_final: Final temperature. + gamma_initial: Initial transverse-field strength (tunnelling). + gamma_final: Final transverse-field strength. + schedule: Temperature decay schedule (``"linear"`` or + ``"exponential"``). + """ + + def __init__( + self, + n_sweeps: int = 1000, + t_initial: float = 10.0, + t_final: float = 0.01, + gamma_initial: float = 2.0, + gamma_final: float = 0.001, + schedule: str = "exponential", + ) -> None: + """Initialise QuantumAnnealing. + + Args: + n_sweeps: Number of Monte Carlo sweeps. + t_initial: Starting temperature. + t_final: Ending temperature. + gamma_initial: Starting transverse-field strength. + gamma_final: Ending transverse-field strength. + schedule: Cooling schedule (``"linear"`` or ``"exponential"``). + + Raises: + ValueError: If schedule is not recognised. + """ + if schedule not in ("linear", "exponential"): + raise ValueError("schedule must be 'linear' or 'exponential'.") + self.n_sweeps = n_sweeps + self.t_initial = t_initial + self.t_final = t_final + self.gamma_initial = gamma_initial + self.gamma_final = gamma_final + self.schedule = schedule + + # ------------------------------------------------------------------ + # Private helpers + # ------------------------------------------------------------------ + + def _temperature(self, step: int) -> float: + """Compute temperature at a given annealing step. + + Args: + step: Current sweep index. + + Returns: + Temperature value. 
+ """ + frac = step / max(self.n_sweeps - 1, 1) + if self.schedule == "linear": + return self.t_initial + frac * (self.t_final - self.t_initial) + # exponential + return self.t_initial * (self.t_final / self.t_initial) ** frac + + def _transverse_field(self, step: int) -> float: + """Compute transverse-field strength at a given step. + + Args: + step: Current sweep index. + + Returns: + Gamma value. + """ + frac = step / max(self.n_sweeps - 1, 1) + if self.schedule == "linear": + return self.gamma_initial + frac * (self.gamma_final - self.gamma_initial) + return self.gamma_initial * (self.gamma_final / self.gamma_initial) ** frac + + # ------------------------------------------------------------------ + # Public interface + # ------------------------------------------------------------------ + + def minimize( + self, + cost_fn: Callable[[np.ndarray], float], + n_variables: int, + seed: int | None = None, + ) -> dict[str, Any]: + """Minimise a binary combinatorial cost function. + + Args: + cost_fn: Function mapping a binary array ``(n_variables,)`` to a + scalar cost. + n_variables: Number of binary decision variables. + seed: Random seed. + + Returns: + Dict with keys ``best_solution`` (binary array as list), + ``best_cost``, ``cost_history``, ``n_sweeps``. 
+ """ + rng = np.random.default_rng(seed) + state = rng.integers(0, 2, size=n_variables).astype(float) + best_state = state.copy() + best_cost = cost_fn(state) + current_cost = best_cost + cost_history: list[float] = [best_cost] + + logger.debug( + f"Quantum annealing: {n_variables} variables, {self.n_sweeps} sweeps" + ) + + for sweep in range(self.n_sweeps): + T = self._temperature(sweep) + gamma = self._transverse_field(sweep) + + # Single spin-flip proposal + flip_idx = int(rng.integers(0, n_variables)) + new_state = state.copy() + new_state[flip_idx] = 1.0 - new_state[flip_idx] + new_cost = cost_fn(new_state) + + delta = new_cost - current_cost + # Quantum tunnelling term: effective acceptance boost for small barriers + tunnel_boost = gamma * np.exp(-abs(delta) / (T + 1e-9)) + acceptance_prob = np.exp(-delta / (T + 1e-9)) + tunnel_boost + + if delta < 0 or rng.random() < min(acceptance_prob, 1.0): + state = new_state + current_cost = new_cost + if current_cost < best_cost: + best_cost = current_cost + best_state = state.copy() + + if sweep % (self.n_sweeps // 10) == 0: + cost_history.append(current_cost) + + logger.debug(f"Annealing complete: best_cost={best_cost:.6f}") + return { + "best_solution": best_state.astype(int).tolist(), + "best_cost": best_cost, + "cost_history": cost_history, + "n_sweeps": self.n_sweeps, + } + + def solve_qubo( + self, + Q: Any, + seed: int | None = None, + ) -> dict[str, Any]: + """Solve a Quadratic Unconstrained Binary Optimisation (QUBO) problem. + + Args: + Q: QUBO matrix of shape ``(n, n)``. Cost = x^T Q x. + seed: Random seed. + + Returns: + Dict with ``best_solution``, ``best_cost``, ``cost_history``. 
+ """ + Q_arr = np.asarray(Q, dtype=np.float64) + n = Q_arr.shape[0] + + def qubo_cost(x: np.ndarray) -> float: + return float(x @ Q_arr @ x) + + return self.minimize(qubo_cost, n, seed=seed) diff --git a/quantum-ai/algorithms/vqe.py b/quantum-ai/algorithms/vqe.py new file mode 100644 index 0000000..a360abc --- /dev/null +++ b/quantum-ai/algorithms/vqe.py @@ -0,0 +1,173 @@ +"""Variational Quantum Eigensolver (VQE) simulation. + +Provides a classical simulation of VQE for finding optimal portfolio weights +by minimising a parameterised quantum circuit's energy. +""" + +from __future__ import annotations + +from typing import Any + +import numpy as np +from scipy.optimize import minimize +from loguru import logger + + +class VQE: + """Classical simulation of VQE for portfolio weight optimisation. + + VQE uses a parameterised quantum circuit (ansatz) to prepare trial states + and minimises the expectation value of the cost Hamiltonian. This + classical simulation encodes portfolio mean-variance as the Hamiltonian. + + Attributes: + n_layers: Depth of the parameterised ansatz circuit. + optimiser: Scipy optimiser method. + max_iter: Maximum optimiser iterations. + convergence_tol: Gradient norm tolerance for convergence. + """ + + def __init__( + self, + n_layers: int = 3, + optimiser: str = "L-BFGS-B", + max_iter: int = 500, + convergence_tol: float = 1e-6, + ) -> None: + """Initialise VQE. + + Args: + n_layers: Number of variational layers. + optimiser: Scipy minimiser method. + max_iter: Maximum function evaluations. + convergence_tol: Convergence tolerance. 
+ """ + self.n_layers = n_layers + self.optimiser = optimiser + self.max_iter = max_iter + self.convergence_tol = convergence_tol + + # ------------------------------------------------------------------ + # Private helpers + # ------------------------------------------------------------------ + + def _ansatz(self, params: np.ndarray, n: int) -> np.ndarray: + """Evaluate the parameterised ansatz to produce portfolio weights. + + The ansatz applies alternating Ry and CNOT-like mixing layers. + Weights are derived as |<0|U(theta)|0>|^2 normalised. + + Args: + params: Flat parameter array of length ``n_layers * n``. + n: Number of assets (qubits). + + Returns: + Portfolio weight vector summing to 1. + """ + # Reshape to (n_layers, n) + thetas = params.reshape(self.n_layers, n) + # Simulate Ry rotations: amplitude = sin(theta/2) + amplitudes = np.ones(n) + for layer_thetas in thetas: + amplitudes = amplitudes * np.cos(layer_thetas / 2) + np.sin(layer_thetas / 2) + probs = np.abs(amplitudes) ** 2 + return probs / (probs.sum() + 1e-12) + + def _energy( + self, + params: np.ndarray, + n: int, + returns: np.ndarray, + cov: np.ndarray, + risk_aversion: float, + ) -> float: + """Compute Hamiltonian expectation value (mean-variance objective). + + Args: + params: Ansatz parameters. + n: Number of assets. + returns: Expected returns. + cov: Covariance matrix. + risk_aversion: Risk-aversion coefficient. + + Returns: + Objective value (to minimise). + """ + w = self._ansatz(params, n) + port_return = float(w @ returns) + port_var = float(w @ cov @ w) + return -(port_return - risk_aversion * port_var) + + # ------------------------------------------------------------------ + # Public interface + # ------------------------------------------------------------------ + + def find_optimal_weights( + self, + returns: Any, + cov_matrix: Any, + risk_aversion: float = 1.0, + ) -> dict[str, Any]: + """Find optimal portfolio weights using VQE simulation. 
+ + Args: + returns: Array of shape ``(n_assets,)`` with expected returns. + cov_matrix: Covariance matrix of shape ``(n_assets, n_assets)``. + risk_aversion: Risk-aversion coefficient. + + Returns: + Dict with keys ``weights``, ``objective``, ``n_assets``, + ``n_layers``, ``converged``. + """ + r = np.asarray(returns, dtype=np.float64) + cov = np.asarray(cov_matrix, dtype=np.float64) + n = len(r) + + logger.debug(f"VQE optimising {n}-asset portfolio, layers={self.n_layers}") + + n_params = self.n_layers * n + x0 = np.random.default_rng().uniform(0, 2 * np.pi, size=n_params) + bounds = [(0, 2 * np.pi)] * n_params + + result = minimize( + self._energy, + x0, + args=(n, r, cov, risk_aversion), + method=self.optimiser, + bounds=bounds, + options={"maxiter": self.max_iter, "ftol": self.convergence_tol}, + ) + + weights = self._ansatz(result.x, n) + obj_val = float(-(weights @ r) + risk_aversion * float(weights @ cov @ weights)) + + logger.debug(f"VQE complete: objective={obj_val:.6f}, converged={result.success}") + return { + "weights": weights.tolist(), + "objective": obj_val, + "n_assets": n, + "n_layers": self.n_layers, + "converged": result.success, + } + + def ground_state_energy( + self, + hamiltonian_matrix: Any, + ) -> dict[str, Any]: + """Find the ground state energy of an arbitrary Hamiltonian matrix. + + Uses the Rayleigh-Ritz variational principle. + + Args: + hamiltonian_matrix: Hermitian matrix of shape ``(d, d)``. + + Returns: + Dict with ``ground_state_energy``, ``ground_state_vector``. 
+ """ + H = np.asarray(hamiltonian_matrix, dtype=np.complex128) + eigenvalues, eigenvectors = np.linalg.eigh(H) + idx = int(np.argmin(eigenvalues)) + return { + "ground_state_energy": float(np.real(eigenvalues[idx])), + "ground_state_vector": eigenvectors[:, idx].tolist(), + } diff --git a/quantum-ai/hybrid/__init__.py b/quantum-ai/hybrid/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/quantum-ai/hybrid/__pycache__/__init__.cpython-312.pyc b/quantum-ai/hybrid/__pycache__/__init__.cpython-312.pyc new file mode 100644 index 0000000..32dd7e3 Binary files /dev/null and b/quantum-ai/hybrid/__pycache__/__init__.cpython-312.pyc differ diff --git a/quantum-ai/hybrid/__pycache__/quantum_classical_hybrid.cpython-312.pyc b/quantum-ai/hybrid/__pycache__/quantum_classical_hybrid.cpython-312.pyc new file mode 100644 index 0000000..9ff3820 Binary files /dev/null and b/quantum-ai/hybrid/__pycache__/quantum_classical_hybrid.cpython-312.pyc differ diff --git a/quantum-ai/hybrid/__pycache__/quantum_neural_network.cpython-312.pyc b/quantum-ai/hybrid/__pycache__/quantum_neural_network.cpython-312.pyc new file mode 100644 index 0000000..a5de517 Binary files /dev/null and b/quantum-ai/hybrid/__pycache__/quantum_neural_network.cpython-312.pyc differ diff --git a/quantum-ai/hybrid/quantum_classical_hybrid.py b/quantum-ai/hybrid/quantum_classical_hybrid.py new file mode 100644 index 0000000..67ab79c --- /dev/null +++ b/quantum-ai/hybrid/quantum_classical_hybrid.py @@ -0,0 +1,197 @@ +"""Quantum-classical hybrid computation engine. + +Provides :class:`QuantumClassicalHybrid` which orchestrates a workflow that +combines quantum-inspired subroutines with classical ML-style post-processing. 
+""" + +from __future__ import annotations + +from typing import Any + +import numpy as np +from scipy.optimize import minimize +from loguru import logger + +try: + from quantum_ai.algorithms.qaoa import QAOA + from quantum_ai.algorithms.vqe import VQE + from quantum_ai.algorithms.quantum_annealing import QuantumAnnealing +except ImportError: + from algorithms.qaoa import QAOA + from algorithms.vqe import VQE + from algorithms.quantum_annealing import QuantumAnnealing + + +class QuantumClassicalHybrid: + """Hybrid computation combining quantum-inspired and classical algorithms. + + Implements a variational hybrid workflow: + + 1. **Quantum phase** – QAOA / VQE produces an approximate solution. + 2. **Classical refinement** – classical gradient-based optimiser polishes + the solution. + 3. **Ensemble** – multiple quantum runs are combined classically. + + Attributes: + qaoa: QAOA sub-system. + vqe: VQE sub-system. + annealer: Quantum annealer sub-system. + n_ensemble: Number of independent quantum runs to ensemble. + classical_refinement_iter: Gradient-descent steps for refinement. + """ + + def __init__( + self, + n_ensemble: int = 5, + classical_refinement_iter: int = 100, + qaoa_params: dict[str, Any] | None = None, + vqe_params: dict[str, Any] | None = None, + annealing_params: dict[str, Any] | None = None, + ) -> None: + """Initialise QuantumClassicalHybrid. + + Args: + n_ensemble: Number of quantum runs per optimisation call. + classical_refinement_iter: Classical refinement iterations. + qaoa_params: Keyword args for :class:`QAOA`. + vqe_params: Keyword args for :class:`VQE`. + annealing_params: Keyword args for :class:`QuantumAnnealing`. 
+ """ + self.n_ensemble = n_ensemble + self.classical_refinement_iter = classical_refinement_iter + self.qaoa = QAOA(**(qaoa_params or {})) + self.vqe = VQE(**(vqe_params or {})) + self.annealer = QuantumAnnealing(**(annealing_params or {})) + + # ------------------------------------------------------------------ + # Private helpers + # ------------------------------------------------------------------ + + def _classical_refine( + self, + initial_weights: np.ndarray, + returns: np.ndarray, + cov: np.ndarray, + risk_aversion: float, + ) -> np.ndarray: + """Apply classical gradient-based refinement to portfolio weights. + + Args: + initial_weights: Starting weight vector. + returns: Expected returns. + cov: Covariance matrix. + risk_aversion: Risk-aversion coefficient. + + Returns: + Refined weight vector (sums to 1, non-negative). + """ + n = len(returns) + + def objective(w: np.ndarray) -> float: + w_n = w / (w.sum() + 1e-12) + return -(float(w_n @ returns) - risk_aversion * float(w_n @ cov @ w_n)) + + constraints = {"type": "eq", "fun": lambda w: w.sum() - 1.0} + bounds = [(0.0, 1.0)] * n + + result = minimize( + objective, initial_weights, method="SLSQP", + bounds=bounds, constraints=constraints, + options={"maxiter": self.classical_refinement_iter, "ftol": 1e-8}, + ) + refined = result.x + refined = np.clip(refined, 0, 1) + refined /= refined.sum() + 1e-12 + return refined + + # ------------------------------------------------------------------ + # Public interface + # ------------------------------------------------------------------ + + def hybrid_portfolio_optimize( + self, + returns: Any, + cov_matrix: Any, + risk_aversion: float = 1.0, + ) -> dict[str, Any]: + """Run hybrid quantum-classical portfolio optimisation. + + Runs multiple QAOA and VQE trials, ensembles the results, then + applies classical refinement for precision. + + Args: + returns: Expected returns array ``(n_assets,)``. + cov_matrix: Covariance matrix ``(n_assets, n_assets)``. 
+ risk_aversion: Risk-aversion coefficient. + + Returns: + Dict with keys ``weights``, ``objective``, ``method``, + ``ensemble_results``. + """ + r = np.asarray(returns, dtype=np.float64) + cov = np.asarray(cov_matrix, dtype=np.float64) + + logger.info( + f"Hybrid optimisation: {len(r)} assets, {self.n_ensemble} ensemble runs" + ) + + ensemble_weights: list[np.ndarray] = [] + ensemble_objectives: list[float] = [] + + for i in range(self.n_ensemble): + # Alternate between QAOA and VQE + if i % 2 == 0: + res = self.qaoa.optimize_portfolio(r, cov, risk_aversion) + else: + res = self.vqe.find_optimal_weights(r, cov, risk_aversion) + w = np.asarray(res["weights"], dtype=np.float64) + ensemble_weights.append(w) + ensemble_objectives.append(res["objective"]) + + # Ensemble: weighted average by inverse-objective + objectives_arr = np.array(ensemble_objectives) + # Lower objective = better; use softmax-like weighting on negated values + scores = np.exp(-objectives_arr - objectives_arr.min()) + ensemble_w = np.array(ensemble_weights) + mean_weights = (scores[:, None] * ensemble_w).sum(axis=0) / scores.sum() + mean_weights /= mean_weights.sum() + 1e-12 + + # Classical refinement + refined = self._classical_refine(mean_weights, r, cov, risk_aversion) + + obj_val = float(-(refined @ r) + risk_aversion * float(refined @ cov @ refined)) + + logger.info(f"Hybrid optimisation complete: objective={obj_val:.6f}") + return { + "weights": refined.tolist(), + "objective": obj_val, + "method": "QuantumClassicalHybrid", + "ensemble_size": self.n_ensemble, + "ensemble_objectives": ensemble_objectives, + } + + def feature_map( + self, + data: Any, + n_features: int | None = None, + ) -> np.ndarray: + """Apply a quantum-inspired feature map to classical data. + + Encodes classical features using angle encoding: maps each feature + to a Pauli-Z expectation value via ``cos(pi * x)``. + + Args: + data: 1-D or 2-D array-like of features. 
+ n_features: Target output dimension; defaults to input dimension. + + Returns: + Feature-mapped array of the same shape. + """ + arr = np.asarray(data, dtype=np.float64) + mapped = np.cos(np.pi * arr) + if n_features and n_features != arr.shape[-1]: + # Random Fourier feature expansion + rng = np.random.default_rng(42) + W = rng.standard_normal((arr.shape[-1], n_features)) + mapped = np.cos(arr @ W / np.sqrt(n_features)) + return mapped diff --git a/quantum-ai/hybrid/quantum_neural_network.py b/quantum-ai/hybrid/quantum_neural_network.py new file mode 100644 index 0000000..5946ff1 --- /dev/null +++ b/quantum-ai/hybrid/quantum_neural_network.py @@ -0,0 +1,210 @@ +"""Quantum-inspired neural network with parameterised rotation gates. + +Provides :class:`QuantumNeuralNetwork` implementing a quantum-circuit-inspired +neural network layer stack using classical NumPy simulation. +""" + +from __future__ import annotations + +from typing import Any + +import numpy as np +from loguru import logger + + +class QuantumNeuralNetwork: + """Quantum-inspired neural network using parameterised rotation gates. + + Each layer applies: + + 1. **Ry rotation** – ``R_y(theta) = [[cos(t/2), -sin(t/2)], [sin(t/2), cos(t/2)]]`` + applied element-wise as an activation-like non-linearity. + 2. **Rz rotation** – phase shift ``R_z(phi) = diag(e^{-i phi/2}, e^{i phi/2})``, + simulated as a magnitude-preserving phase rotation. + 3. **Entanglement layer** – a parameterised mixing matrix derived from a + random unitary to simulate CNOT-based entanglement. + + Attributes: + n_qubits: Width of the network (number of quantum feature dimensions). + n_layers: Depth of the network. + learning_rate: Parameter update step for gradient-free training. + seed: Random seed. + """ + + def __init__( + self, + n_qubits: int = 4, + n_layers: int = 3, + learning_rate: float = 0.01, + seed: int | None = None, + ) -> None: + """Initialise QuantumNeuralNetwork. 
+ + Args: + n_qubits: Number of qubits (input/output feature dimension). + n_layers: Circuit depth. + learning_rate: Step size for parameter updates. + seed: Random seed. + """ + self.n_qubits = n_qubits + self.n_layers = n_layers + self.learning_rate = learning_rate + self._rng = np.random.default_rng(seed) + + # Initialise trainable parameters: theta (Ry), phi (Rz), mixing matrix + self.thetas = self._rng.uniform(0, 2 * np.pi, (n_layers, n_qubits)) + self.phis = self._rng.uniform(0, 2 * np.pi, (n_layers, n_qubits)) + self.mixing = [ + self._random_unitary(n_qubits) for _ in range(n_layers) + ] + + # ------------------------------------------------------------------ + # Private helpers + # ------------------------------------------------------------------ + + def _random_unitary(self, n: int) -> np.ndarray: + """Generate a random orthogonal matrix via QR decomposition. + + Args: + n: Matrix dimension. + + Returns: + n×n orthogonal matrix. + """ + A = self._rng.standard_normal((n, n)) + Q, _ = np.linalg.qr(A) + return Q + + def _ry_gate(self, x: np.ndarray, theta: np.ndarray) -> np.ndarray: + """Apply element-wise Ry rotation. + + Args: + x: Input feature vector. + theta: Rotation angles. + + Returns: + Rotated vector. + """ + return x * np.cos(theta / 2) + np.roll(x, 1) * np.sin(theta / 2) + + def _rz_gate(self, x: np.ndarray, phi: np.ndarray) -> np.ndarray: + """Apply element-wise Rz phase gate (real-valued approximation). + + Args: + x: Input feature vector. + phi: Phase angles. + + Returns: + Phase-shifted vector. + """ + return x * np.cos(phi) - np.roll(x, 1) * np.sin(phi) + + # ------------------------------------------------------------------ + # Public interface + # ------------------------------------------------------------------ + + def forward(self, x: Any) -> np.ndarray: + """Forward pass through the quantum-inspired network. + + Args: + x: Input feature vector of length ``n_qubits`` or batch of shape + ``(batch_size, n_qubits)``. 
+ + Returns: + Output array of the same shape. + + Raises: + ValueError: If the last dimension of *x* does not match + ``n_qubits``. + """ + arr = np.asarray(x, dtype=np.float64) + single = arr.ndim == 1 + if single: + arr = arr[np.newaxis, :] + + if arr.shape[-1] != self.n_qubits: + raise ValueError( + f"Input last dim {arr.shape[-1]} != n_qubits {self.n_qubits}" + ) + + out = arr.copy() + for layer in range(self.n_layers): + out = self._ry_gate(out, self.thetas[layer]) + out = self._rz_gate(out, self.phis[layer]) + out = out @ self.mixing[layer].T + # Non-linear activation (tanh as quantum measurement-like squashing) + out = np.tanh(out) + + return out[0] if single else out + + def update_params( + self, + grad_thetas: np.ndarray, + grad_phis: np.ndarray, + ) -> None: + """Update trainable parameters via gradient descent. + + Args: + grad_thetas: Gradient array of shape ``(n_layers, n_qubits)`` + for theta parameters. + grad_phis: Gradient array of shape ``(n_layers, n_qubits)`` + for phi parameters. + """ + self.thetas -= self.learning_rate * grad_thetas + self.phis -= self.learning_rate * grad_phis + + def parameter_shift_gradient( + self, + x: Any, + loss_fn: Any, + shift: float = np.pi / 2, + ) -> tuple[np.ndarray, np.ndarray]: + """Estimate gradients using the parameter-shift rule. + + The parameter-shift rule: ``dE/dtheta = (E(theta+pi/2) - E(theta-pi/2)) / 2`` + + Args: + x: Input feature vector. + loss_fn: Callable that takes a forward-pass output and returns a + scalar loss. + shift: Shift angle (default pi/2 for standard shift rule). + + Returns: + Tuple of ``(grad_thetas, grad_phis)`` each of shape + ``(n_layers, n_qubits)``. 
+ """ + grad_thetas = np.zeros_like(self.thetas) + grad_phis = np.zeros_like(self.phis) + + for l in range(self.n_layers): + for q in range(self.n_qubits): + # Theta gradients + self.thetas[l, q] += shift + loss_plus = loss_fn(self.forward(x)) + self.thetas[l, q] -= 2 * shift + loss_minus = loss_fn(self.forward(x)) + self.thetas[l, q] += shift + grad_thetas[l, q] = (loss_plus - loss_minus) / 2 + + # Phi gradients + self.phis[l, q] += shift + loss_plus = loss_fn(self.forward(x)) + self.phis[l, q] -= 2 * shift + loss_minus = loss_fn(self.forward(x)) + self.phis[l, q] += shift + grad_phis[l, q] = (loss_plus - loss_minus) / 2 + + return grad_thetas, grad_phis + + def get_params(self) -> dict[str, Any]: + """Return current trainable parameters. + + Returns: + Dict with keys ``thetas``, ``phis`` as nested lists. + """ + return { + "thetas": self.thetas.tolist(), + "phis": self.phis.tolist(), + "n_layers": self.n_layers, + "n_qubits": self.n_qubits, + } diff --git a/quantum-ai/simulators/__init__.py b/quantum-ai/simulators/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/quantum-ai/simulators/__pycache__/__init__.cpython-312.pyc b/quantum-ai/simulators/__pycache__/__init__.cpython-312.pyc new file mode 100644 index 0000000..b971664 Binary files /dev/null and b/quantum-ai/simulators/__pycache__/__init__.cpython-312.pyc differ diff --git a/quantum-ai/simulators/__pycache__/noise_model.cpython-312.pyc b/quantum-ai/simulators/__pycache__/noise_model.cpython-312.pyc new file mode 100644 index 0000000..9ea4d50 Binary files /dev/null and b/quantum-ai/simulators/__pycache__/noise_model.cpython-312.pyc differ diff --git a/quantum-ai/simulators/__pycache__/quantum_simulator.cpython-312.pyc b/quantum-ai/simulators/__pycache__/quantum_simulator.cpython-312.pyc new file mode 100644 index 0000000..aa4c7ca Binary files /dev/null and b/quantum-ai/simulators/__pycache__/quantum_simulator.cpython-312.pyc differ diff --git a/quantum-ai/simulators/noise_model.py 
b/quantum-ai/simulators/noise_model.py new file mode 100644 index 0000000..04b1034 --- /dev/null +++ b/quantum-ai/simulators/noise_model.py @@ -0,0 +1,273 @@ +"""Quantum noise model: depolarising, bit-flip, and phase-flip error channels. + +Provides :class:`NoiseModel` for simulating realistic quantum error channels +on state vectors and density matrices. +""" + +from __future__ import annotations + +from typing import Any + +import numpy as np +from loguru import logger + + +class NoiseModel: + """Simulate quantum noise channels on qubit state vectors. + + Implements three standard error channels: + + * **Depolarising** – replaces the qubit state with the maximally mixed + state with probability *p*. + * **Bit-flip** – applies Pauli-X with probability *p*. + * **Phase-flip** – applies Pauli-Z with probability *p*. + * **Amplitude damping** – models energy relaxation (T1 decay). + + Attributes: + depolarising_prob: Default depolarising error probability. + bit_flip_prob: Default bit-flip error probability. + phase_flip_prob: Default phase-flip error probability. + amplitude_damping_gamma: Amplitude damping parameter (0 ≤ gamma ≤ 1). + """ + + _PAULI_X = np.array([[0, 1], [1, 0]], dtype=np.complex128) + _PAULI_Y = np.array([[0, -1j], [1j, 0]], dtype=np.complex128) + _PAULI_Z = np.array([[1, 0], [0, -1]], dtype=np.complex128) + _I = np.eye(2, dtype=np.complex128) + + def __init__( + self, + depolarising_prob: float = 0.01, + bit_flip_prob: float = 0.01, + phase_flip_prob: float = 0.01, + amplitude_damping_gamma: float = 0.01, + seed: int | None = None, + ) -> None: + """Initialise NoiseModel. + + Args: + depolarising_prob: Probability of depolarising error per gate. + bit_flip_prob: Probability of bit-flip error per gate. + phase_flip_prob: Probability of phase-flip error per gate. + amplitude_damping_gamma: Energy relaxation parameter. + seed: Random seed. 
+ """ + for name, val in [ + ("depolarising_prob", depolarising_prob), + ("bit_flip_prob", bit_flip_prob), + ("phase_flip_prob", phase_flip_prob), + ("amplitude_damping_gamma", amplitude_damping_gamma), + ]: + if not 0 <= val <= 1: + raise ValueError(f"{name} must be in [0, 1].") + + self.depolarising_prob = depolarising_prob + self.bit_flip_prob = bit_flip_prob + self.phase_flip_prob = phase_flip_prob + self.amplitude_damping_gamma = amplitude_damping_gamma + self._rng = np.random.default_rng(seed) + + # ------------------------------------------------------------------ + # Private helpers + # ------------------------------------------------------------------ + + def _apply_kraus( + self, + rho: np.ndarray, + kraus_ops: list[np.ndarray], + ) -> np.ndarray: + """Apply a Kraus operator representation to a density matrix. + + Args: + rho: Density matrix (2×2 or 2^n × 2^n). + kraus_ops: List of Kraus matrices satisfying sum(K†K) = I. + + Returns: + Output density matrix. + """ + return sum(K @ rho @ K.conj().T for K in kraus_ops) + + @staticmethod + def _pure_to_dm(state: np.ndarray) -> np.ndarray: + """Convert a pure state vector to a density matrix. + + Args: + state: 1-D complex state vector. + + Returns: + Density matrix ρ = |ψ⟩⟨ψ|. + """ + return np.outer(state, state.conj()) + + @staticmethod + def _dm_to_pure(rho: np.ndarray) -> np.ndarray: + """Extract the dominant eigenvector from a density matrix. + + Args: + rho: Density matrix. + + Returns: + Approximate pure state vector. + """ + eigenvalues, eigenvectors = np.linalg.eigh(rho) + return eigenvectors[:, -1] + + # ------------------------------------------------------------------ + # Public noise channels + # ------------------------------------------------------------------ + + def depolarising_channel( + self, + state: Any, + prob: float | None = None, + ) -> np.ndarray: + """Apply the depolarising channel to a single-qubit state. 
+ + The channel maps ρ → (1 - p)ρ + (p/4)(I ρ I + X ρ X + Y ρ Y + Z ρ Z) + = (1 - p)ρ + (p/2)I + + Args: + state: 1-D state vector or 2×2 density matrix. + prob: Error probability; defaults to :attr:`depolarising_prob`. + + Returns: + Output density matrix. + """ + p = prob if prob is not None else self.depolarising_prob + arr = np.asarray(state, dtype=np.complex128) + rho = arr if arr.ndim == 2 else self._pure_to_dm(arr) + + kraus = [ + np.sqrt(1 - p) * self._I, + np.sqrt(p / 3) * self._PAULI_X, + np.sqrt(p / 3) * self._PAULI_Y, + np.sqrt(p / 3) * self._PAULI_Z, + ] + return self._apply_kraus(rho, kraus) + + def bit_flip_channel( + self, + state: Any, + prob: float | None = None, + ) -> np.ndarray: + """Apply the bit-flip channel. + + Maps ρ → (1-p)ρ + p X ρ X + + Args: + state: State vector or density matrix. + prob: Bit-flip probability; defaults to :attr:`bit_flip_prob`. + + Returns: + Output density matrix. + """ + p = prob if prob is not None else self.bit_flip_prob + arr = np.asarray(state, dtype=np.complex128) + rho = arr if arr.ndim == 2 else self._pure_to_dm(arr) + kraus = [np.sqrt(1 - p) * self._I, np.sqrt(p) * self._PAULI_X] + return self._apply_kraus(rho, kraus) + + def phase_flip_channel( + self, + state: Any, + prob: float | None = None, + ) -> np.ndarray: + """Apply the phase-flip channel. + + Maps ρ → (1-p)ρ + p Z ρ Z + + Args: + state: State vector or density matrix. + prob: Phase-flip probability; defaults to :attr:`phase_flip_prob`. + + Returns: + Output density matrix. + """ + p = prob if prob is not None else self.phase_flip_prob + arr = np.asarray(state, dtype=np.complex128) + rho = arr if arr.ndim == 2 else self._pure_to_dm(arr) + kraus = [np.sqrt(1 - p) * self._I, np.sqrt(p) * self._PAULI_Z] + return self._apply_kraus(rho, kraus) + + def amplitude_damping_channel( + self, + state: Any, + gamma: float | None = None, + ) -> np.ndarray: + """Apply the amplitude damping channel (T1 relaxation). 
+ + Kraus operators: K0 = [[1,0],[0,sqrt(1-gamma)]], K1 = [[0,sqrt(gamma)],[0,0]] + + Args: + state: State vector or density matrix. + gamma: Damping parameter; defaults to :attr:`amplitude_damping_gamma`. + + Returns: + Output density matrix. + """ + g = gamma if gamma is not None else self.amplitude_damping_gamma + arr = np.asarray(state, dtype=np.complex128) + rho = arr if arr.ndim == 2 else self._pure_to_dm(arr) + + K0 = np.array([[1, 0], [0, np.sqrt(1 - g)]], dtype=np.complex128) + K1 = np.array([[0, np.sqrt(g)], [0, 0]], dtype=np.complex128) + return self._apply_kraus(rho, [K0, K1]) + + def apply_noise_to_circuit( + self, + state_vector: Any, + gate_count: int, + noise_type: str = "depolarising", + ) -> dict[str, Any]: + """Apply noise after each gate in a circuit. + + Simulates accumulated noise over a sequence of gates. + + Args: + state_vector: Initial state vector of length ``2^n``. + gate_count: Number of gates in the circuit. + noise_type: ``"depolarising"``, ``"bit_flip"``, or + ``"phase_flip"``. + + Returns: + Dict with ``final_density_matrix`` (list of lists), + ``fidelity_with_ideal`` (float), ``purity`` (float). 
+ """ + arr = np.asarray(state_vector, dtype=np.complex128) + ideal_rho = self._pure_to_dm(arr) + rho = ideal_rho.copy() + + channel_map = { + "depolarising": self.depolarising_channel, + "bit_flip": self.bit_flip_channel, + "phase_flip": self.phase_flip_channel, + } + if noise_type not in channel_map: + raise ValueError(f"noise_type must be one of {list(channel_map)}") + + channel = channel_map[noise_type] + + if rho.shape == (2, 2): + for _ in range(gate_count): + rho = channel(rho) + else: + # Apply noise to each 2x2 sub-block (approximate) + n = rho.shape[0] + for _ in range(gate_count): + p = (self.depolarising_prob + self.bit_flip_prob) / 2 + rho = (1 - p) * rho + p * np.eye(n, dtype=np.complex128) / n + + fidelity = float(np.real(np.trace(ideal_rho @ rho))) + purity = float(np.real(np.trace(rho @ rho))) + + logger.debug( + f"Noise circuit: {gate_count} gates, fidelity={fidelity:.4f}, " + f"purity={purity:.4f}" + ) + return { + "final_density_matrix": rho.tolist(), + "fidelity_with_ideal": round(fidelity, 6), + "purity": round(purity, 6), + "gate_count": gate_count, + "noise_type": noise_type, + } diff --git a/quantum-ai/simulators/quantum_simulator.py b/quantum-ai/simulators/quantum_simulator.py new file mode 100644 index 0000000..1e81c5c --- /dev/null +++ b/quantum-ai/simulators/quantum_simulator.py @@ -0,0 +1,253 @@ +"""Quantum circuit simulator: classical simulation using NumPy state vectors. + +Provides :class:`QuantumSimulator` for simulating small quantum circuits via +exact state-vector evolution. 
+""" + +from __future__ import annotations + +from typing import Any + +import numpy as np +from loguru import logger + + +# --------------------------------------------------------------------------- +# Standard single-qubit gate matrices +# --------------------------------------------------------------------------- + +_GATES: dict[str, np.ndarray] = { + "I": np.eye(2, dtype=np.complex128), + "X": np.array([[0, 1], [1, 0]], dtype=np.complex128), + "Y": np.array([[0, -1j], [1j, 0]], dtype=np.complex128), + "Z": np.array([[1, 0], [0, -1]], dtype=np.complex128), + "H": np.array([[1, 1], [1, -1]], dtype=np.complex128) / np.sqrt(2), + "S": np.array([[1, 0], [0, 1j]], dtype=np.complex128), + "T": np.array([[1, 0], [0, np.exp(1j * np.pi / 4)]], dtype=np.complex128), +} + + +class QuantumSimulator: + """Classical state-vector quantum circuit simulator. + + Supports an arbitrary number of qubits (up to the memory limits of the + host machine) and a standard gate set including Ry, Rz, CNOT, CZ, Toffoli, + and SWAP. + + Attributes: + n_qubits: Number of qubits in the circuit. + state: Current state vector of length ``2^n_qubits``. + """ + + def __init__(self, n_qubits: int = 4) -> None: + """Initialise the simulator in the |0...0⟩ state. + + Args: + n_qubits: Number of qubits. + + Raises: + ValueError: If n_qubits < 1 or > 20 (memory guard). + """ + if not 1 <= n_qubits <= 20: + raise ValueError("n_qubits must be between 1 and 20.") + self.n_qubits = n_qubits + self.state: np.ndarray = np.zeros(2 ** n_qubits, dtype=np.complex128) + self.state[0] = 1.0 + logger.debug(f"QuantumSimulator: {n_qubits} qubits, dim={2**n_qubits}") + + # ------------------------------------------------------------------ + # Private helpers + # ------------------------------------------------------------------ + + def _apply_single_qubit_gate( + self, gate: np.ndarray, target: int + ) -> None: + """Apply a 2×2 gate to a single qubit via tensor product expansion. + + Args: + gate: 2×2 unitary matrix. 
+ target: Zero-indexed qubit to apply the gate to. + """ + n = self.n_qubits + # Build the full 2^n × 2^n operator using tensored identity + ops = [_GATES["I"]] * n + ops[target] = gate + full = ops[0] + for op in ops[1:]: + full = np.kron(full, op) + self.state = full @ self.state + + def _apply_two_qubit_gate( + self, gate: np.ndarray, control: int, target: int + ) -> None: + """Apply a controlled two-qubit gate. + + Builds the full operator by projecting on control qubit states. + + Args: + gate: 4×4 unitary matrix. + control: Control qubit index. + target: Target qubit index. + """ + n = self.n_qubits + dim = 2 ** n + full = np.zeros((dim, dim), dtype=np.complex128) + + for i in range(dim): + ctrl_bit = (i >> (n - 1 - control)) & 1 + tgt_bit = (i >> (n - 1 - target)) & 1 + sub_idx = ctrl_bit * 2 + tgt_bit + for j in range(dim): + ctrl_bit_j = (j >> (n - 1 - control)) & 1 + tgt_bit_j = (j >> (n - 1 - target)) & 1 + # Other qubits must match + other_match = True + for q in range(n): + if q != control and q != target: + if ((i >> (n - 1 - q)) & 1) != ((j >> (n - 1 - q)) & 1): + other_match = False + break + if other_match: + sub_j = ctrl_bit_j * 2 + tgt_bit_j + full[i, j] = gate[sub_idx, sub_j] + + self.state = full @ self.state + + # ------------------------------------------------------------------ + # Gate operations + # ------------------------------------------------------------------ + + def h(self, qubit: int) -> "QuantumSimulator": + """Apply Hadamard gate. + + Args: + qubit: Target qubit index. + + Returns: + Self for method chaining. + """ + self._apply_single_qubit_gate(_GATES["H"], qubit) + return self + + def x(self, qubit: int) -> "QuantumSimulator": + """Apply Pauli-X (NOT) gate. + + Args: + qubit: Target qubit index. + + Returns: + Self for method chaining. + """ + self._apply_single_qubit_gate(_GATES["X"], qubit) + return self + + def ry(self, qubit: int, theta: float) -> "QuantumSimulator": + """Apply Ry rotation gate. 
+ + Args: + qubit: Target qubit. + theta: Rotation angle in radians. + + Returns: + Self for method chaining. + """ + gate = np.array([ + [np.cos(theta / 2), -np.sin(theta / 2)], + [np.sin(theta / 2), np.cos(theta / 2)], + ], dtype=np.complex128) + self._apply_single_qubit_gate(gate, qubit) + return self + + def rz(self, qubit: int, phi: float) -> "QuantumSimulator": + """Apply Rz rotation gate. + + Args: + qubit: Target qubit. + phi: Rotation angle in radians. + + Returns: + Self for method chaining. + """ + gate = np.array([ + [np.exp(-1j * phi / 2), 0], + [0, np.exp(1j * phi / 2)], + ], dtype=np.complex128) + self._apply_single_qubit_gate(gate, qubit) + return self + + def cnot(self, control: int, target: int) -> "QuantumSimulator": + """Apply CNOT gate. + + Args: + control: Control qubit. + target: Target qubit. + + Returns: + Self for method chaining. + """ + cnot_gate = np.array([ + [1, 0, 0, 0], + [0, 1, 0, 0], + [0, 0, 0, 1], + [0, 0, 1, 0], + ], dtype=np.complex128) + self._apply_two_qubit_gate(cnot_gate, control, target) + return self + + # ------------------------------------------------------------------ + # Measurement + # ------------------------------------------------------------------ + + def measure( + self, n_shots: int = 1024, seed: int | None = None + ) -> dict[str, Any]: + """Simulate projective measurements. + + Args: + n_shots: Number of measurement shots. + seed: Random seed. + + Returns: + Dict with ``counts`` (bitstring → count), ``probabilities`` + (bitstring → float), ``state_vector`` (complex list). 
+ """ + probs = np.abs(self.state) ** 2 + probs /= probs.sum() + + rng = np.random.default_rng(seed) + outcomes = rng.choice(len(probs), size=n_shots, p=probs) + + counts: dict[str, int] = {} + for outcome in outcomes: + bitstring = format(outcome, f"0{self.n_qubits}b") + counts[bitstring] = counts.get(bitstring, 0) + 1 + + prob_dict = { + format(i, f"0{self.n_qubits}b"): float(p) + for i, p in enumerate(probs) + if p > 1e-10 + } + + return { + "counts": counts, + "probabilities": prob_dict, + "state_vector": self.state.tolist(), + } + + def reset(self) -> "QuantumSimulator": + """Reset to |0...0⟩ state. + + Returns: + Self for method chaining. + """ + self.state = np.zeros(2 ** self.n_qubits, dtype=np.complex128) + self.state[0] = 1.0 + return self + + def statevector(self) -> list[complex]: + """Return the current normalised state vector. + + Returns: + State vector as a list of complex numbers. + """ + return self.state.tolist() diff --git a/shared/__init__.py b/shared/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/shared/__pycache__/__init__.cpython-312.pyc b/shared/__pycache__/__init__.cpython-312.pyc new file mode 100644 index 0000000..3a6f43f Binary files /dev/null and b/shared/__pycache__/__init__.cpython-312.pyc differ diff --git a/shared/common/__init__.py b/shared/common/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/shared/common/__pycache__/__init__.cpython-312.pyc b/shared/common/__pycache__/__init__.cpython-312.pyc new file mode 100644 index 0000000..16e0b04 Binary files /dev/null and b/shared/common/__pycache__/__init__.cpython-312.pyc differ diff --git a/shared/common/__pycache__/config.cpython-312.pyc b/shared/common/__pycache__/config.cpython-312.pyc new file mode 100644 index 0000000..52a347c Binary files /dev/null and b/shared/common/__pycache__/config.cpython-312.pyc differ diff --git a/shared/common/__pycache__/exceptions.cpython-312.pyc b/shared/common/__pycache__/exceptions.cpython-312.pyc new 
file mode 100644 index 0000000..baff0a5 Binary files /dev/null and b/shared/common/__pycache__/exceptions.cpython-312.pyc differ diff --git a/shared/common/__pycache__/logger.cpython-312.pyc b/shared/common/__pycache__/logger.cpython-312.pyc new file mode 100644 index 0000000..77539f3 Binary files /dev/null and b/shared/common/__pycache__/logger.cpython-312.pyc differ diff --git a/shared/common/__pycache__/utils.cpython-312.pyc b/shared/common/__pycache__/utils.cpython-312.pyc new file mode 100644 index 0000000..67c60b0 Binary files /dev/null and b/shared/common/__pycache__/utils.cpython-312.pyc differ diff --git a/shared/common/config.py b/shared/common/config.py new file mode 100644 index 0000000..9684ac5 --- /dev/null +++ b/shared/common/config.py @@ -0,0 +1,251 @@ +"""Configuration management for the trading platform. + +Loads settings from (in ascending priority order): + +1. Hard-coded defaults +2. ``config.yaml`` found relative to the project root (or the path supplied + via the ``CONFIG_FILE`` environment variable). +3. Environment variables with the prefix ``TRADING_``. + +Uses *pydantic-settings* so every field is validated and type-coerced at +startup. A singleton :func:`get_config` accessor avoids repeated parsing. 
class DatabaseSettings(BaseSettings):
    """Relational / time-series database connection settings.

    Values are read from ``TRADING_DB_*`` environment variables with
    development-friendly defaults.
    """

    model_config = SettingsConfigDict(env_prefix="TRADING_DB_", extra="ignore")

    host: str = Field("localhost", description="Database host.")
    port: int = Field(5432, ge=1, le=65535, description="Database port.")
    name: str = Field("trading", description="Database name.")
    user: str = Field("trading_user", description="Database user.")
    password: SecretStr = Field(
        SecretStr("changeme"), description="Database password."
    )
    pool_size: int = Field(10, ge=1, le=200, description="Connection pool size.")
    pool_max_overflow: int = Field(20, ge=0, description="Max pool overflow.")

    @property
    def dsn(self) -> str:
        """Return a PostgreSQL DSN string (password not redacted).

        The user and password are percent-encoded so credentials containing
        URL-reserved characters (``@``, ``:``, ``/``, ...) cannot corrupt
        the DSN. Plain alphanumeric credentials render exactly as before.
        """
        # Local import: keeps the module's top-level import surface unchanged.
        from urllib.parse import quote

        user = quote(self.user, safe="")
        pwd = quote(self.password.get_secret_value(), safe="")
        return (
            f"postgresql+asyncpg://{user}:{pwd}"
            f"@{self.host}:{self.port}/{self.name}"
        )
class RiskSettings(BaseSettings):
    """Hard limits enforced by the risk-management layer."""

    model_config = SettingsConfigDict(env_prefix="TRADING_RISK_", extra="ignore")

    max_position_size_usd: float = Field(
        100_000.0, gt=0, description="Maximum single-position value in USD."
    )
    max_portfolio_drawdown_pct: float = Field(
        10.0, gt=0, le=100, description="Hard drawdown limit as a percentage."
    )
    max_order_size_usd: float = Field(
        50_000.0, gt=0, description="Maximum single-order value in USD."
    )
    daily_loss_limit_usd: float = Field(
        20_000.0, gt=0, description="Maximum daily realised loss before halt."
    )


class LoggingSettings(BaseSettings):
    """Logging sink configuration: level, rotation, retention, format."""

    model_config = SettingsConfigDict(env_prefix="TRADING_LOG_", extra="ignore")

    level: str = Field("INFO", description="Log level.")
    log_dir: str | None = Field(None, description="Directory for rotating log files.")
    rotation: str = Field("100 MB", description="Log rotation trigger.")
    retention: str = Field("30 days", description="Log retention policy.")
    serialize: bool = Field(False, description="Emit JSON log lines.")

    @field_validator("level")
    @classmethod
    def validate_level(cls, v: str) -> str:
        """Upper-case the level and reject names loguru does not know."""
        valid = {"TRACE", "DEBUG", "INFO", "SUCCESS", "WARNING", "ERROR", "CRITICAL"}
        candidate = v.upper()
        if candidate in valid:
            return candidate
        raise ValueError(f"Invalid log level {v!r}. Must be one of {valid}.")
+ ) + timeout_seconds: float = Field(5.0, gt=0, description="Inference timeout.") + confidence_threshold: float = Field( + 0.7, ge=0.0, le=1.0, description="Minimum signal confidence to act." + ) + + +# --------------------------------------------------------------------------- +# Root settings +# --------------------------------------------------------------------------- + + +class TradingPlatformSettings(BaseSettings): + """Root configuration for the trading platform. + + Environment variables are prefixed with ``TRADING_``. Nested models read + their own prefixes (e.g. ``TRADING_DB_HOST``). + """ + + model_config = SettingsConfigDict( + env_prefix="TRADING_", + env_nested_delimiter="__", + extra="ignore", + ) + + environment: str = Field( + "development", + description="Deployment environment (development | staging | production).", + ) + service_name: str = Field("trading-platform", description="Service identifier.") + debug: bool = Field(False, description="Enable debug mode.") + + database: DatabaseSettings = Field(default_factory=DatabaseSettings) + redis: RedisSettings = Field(default_factory=RedisSettings) + exchange: ExchangeSettings = Field(default_factory=ExchangeSettings) + risk: RiskSettings = Field(default_factory=RiskSettings) + logging: LoggingSettings = Field(default_factory=LoggingSettings) + agi: AGISettings = Field(default_factory=AGISettings) + + @field_validator("environment") + @classmethod + def validate_environment(cls, v: str) -> str: + """Constrain to known deployment tiers.""" + valid = {"development", "staging", "production"} + if v not in valid: + raise ValueError( + f"Unknown environment {v!r}. Must be one of {valid}." + ) + return v + + @classmethod + def from_yaml(cls, path: Path) -> "TradingPlatformSettings": + """Build settings from a YAML file, then overlay environment variables. + + Args: + path: Absolute or relative path to ``config.yaml``. + + Returns: + A fully validated :class:`TradingPlatformSettings` instance. 
def _resolve_config_path() -> Path | None:
    """Locate a ``config.yaml`` file.

    Resolution order:

    1. The ``CONFIG_FILE`` environment variable, taken verbatim.
    2. ``config.yaml`` in the current directory, its parent, or the
       project root inferred from this module's location.

    Returns:
        Path to the configuration file, or ``None`` when nothing is found.
    """
    env_path = os.getenv("CONFIG_FILE")
    if env_path:
        return Path(env_path)

    # Walk up from cwd looking for config.yaml.
    candidates = [Path.cwd(), Path.cwd().parent]
    try:
        # parents[3] raises IndexError when this module sits too close to
        # the filesystem root (e.g. installed at a shallow path); treat
        # that as "no project root candidate" instead of crashing.
        candidates.append(Path(__file__).parents[3])
    except IndexError:
        pass

    for candidate in candidates:
        p = candidate / "config.yaml"
        if p.exists():
            return p

    return None


@lru_cache(maxsize=1)
def get_config() -> TradingPlatformSettings:
    """Return the singleton platform configuration.

    Loads from YAML (if found) then overlays environment variables. Cached
    after the first call for the lifetime of the process.

    Returns:
        The validated :class:`TradingPlatformSettings` instance.
    """
    config_path = _resolve_config_path()
    if config_path:
        return TradingPlatformSettings.from_yaml(config_path)
    return TradingPlatformSettings()
class TradingPlatformError(Exception):
    """Root of the platform exception hierarchy.

    Every platform-specific error derives from this class, so a single
    ``except TradingPlatformError`` clause catches the whole family.

    Args:
        message: Human-readable error description.
        code: Optional machine-readable error code for structured handling.
        context: Optional mapping of extra diagnostic key-value pairs.
    """

    def __init__(
        self,
        message: str,
        code: str | None = None,
        context: dict[str, Any] | None = None,
    ) -> None:
        super().__init__(message)
        self.message = message
        self.code = code
        self.context: dict[str, Any] = context or {}

    def __repr__(self) -> str:  # noqa: D105
        name = type(self).__name__
        parts = (
            f"message={self.message!r}",
            f"code={self.code!r}",
            f"context={self.context!r}",
        )
        return f"{name}({', '.join(parts)})"


# ---------------------------------------------------------------------------
# Configuration
# ---------------------------------------------------------------------------


class ConfigurationError(TradingPlatformError):
    """Raised when configuration is missing or invalid."""


# ---------------------------------------------------------------------------
# AGI / ML subsystem
# ---------------------------------------------------------------------------


class AGIError(TradingPlatformError):
    """Base class for AGI/ML orchestration errors."""
class InferenceError(AGIError):
    """Raised when model inference fails or returns an unusable result."""


# ---------------------------------------------------------------------------
# Trading subsystem
# ---------------------------------------------------------------------------


class TradingError(TradingPlatformError):
    """Base class for trading-execution errors."""


class OrderError(TradingError):
    """Base class for order-lifecycle errors."""


class OrderNotFoundError(OrderError):
    """Raised when an order ID cannot be located."""


class OrderRejectedError(OrderError):
    """Raised when an exchange or broker rejects an order.

    Args:
        order_id: The order identifier that was rejected.
        reason: Exchange/broker rejection reason string.
        **kwargs: Forwarded to :class:`TradingPlatformError`.
    """

    def __init__(self, order_id: str, reason: str, **kwargs: Any) -> None:
        details = {"order_id": order_id, "reason": reason}
        super().__init__(
            f"Order {order_id!r} rejected: {reason}",
            context=details,
            **kwargs,
        )
        self.order_id = order_id
        self.reason = reason


class DuplicateOrderError(OrderError):
    """Raised on an attempt to submit an order with an already-used client ID."""


class PositionError(TradingError):
    """Base class for position-management errors."""


class InsufficientFundsError(PositionError):
    """Raised when available capital is below what an order requires."""


class RiskLimitError(TradingError):
    """Raised when a risk limit is breached."""


class MaxDrawdownError(RiskLimitError):
    """Raised when the portfolio max-drawdown threshold is exceeded."""


class PositionSizeLimitError(RiskLimitError):
    """Raised when a single position would exceed the configured size limit."""
class DataError(TradingPlatformError):
    """Base class for data-related errors."""


class MarketDataError(DataError):
    """Raised when market-data retrieval or parsing fails."""


class StaleDataError(MarketDataError):
    """Raised when market data is older than the acceptable staleness threshold."""


class ValidationError(DataError):
    """Raised when a data model fails validation.

    Args:
        field: The field name that failed validation.
        value: The offending value.
        **kwargs: Forwarded to :class:`TradingPlatformError`.
    """

    def __init__(self, field: str, value: Any, **kwargs: Any) -> None:
        details = {"field": field, "value": value}
        super().__init__(
            f"Validation failed for field {field!r}: {value!r}",
            context=details,
            **kwargs,
        )
        self.field = field
        self.value = value


# ---------------------------------------------------------------------------
# Connectivity
# ---------------------------------------------------------------------------


class ConnectivityError(TradingPlatformError):
    """Base class for connection / transport errors."""


class BrokerConnectionError(ConnectivityError):
    """Raised when the connection to a broker is lost or unavailable."""


class ExchangeConnectionError(ConnectivityError):
    """Raised when the connection to a crypto/equity exchange fails."""


# ---------------------------------------------------------------------------
# Authentication / authorisation
# ---------------------------------------------------------------------------


class AuthenticationError(TradingPlatformError):
    """Raised on authentication or API-key verification failures."""
import sys
from contextvars import ContextVar
from pathlib import Path
from typing import Any

from loguru import logger as _logger

# Correlation ID propagated per async task / thread via contextvars.
_correlation_id: ContextVar[str] = ContextVar("correlation_id", default="")


def _correlation_filter(record: dict[str, Any]) -> bool:
    """Attach the context's correlation ID to *record* and keep the record.

    Args:
        record: The loguru log record dict.

    Returns:
        Always True so the record is never filtered out.
    """
    record["extra"].setdefault("correlation_id", _correlation_id.get())
    return True


def configure_logger(
    log_level: str = "INFO",
    log_dir: str | None = None,
    rotation: str = "100 MB",
    retention: str = "30 days",
    compression: str = "gz",
    serialize: bool = False,
) -> None:
    """Configure the global loguru logger.

    Installs a colourised stderr sink and, when *log_dir* is given, a
    rotating file sink. Every record emitted through either sink carries
    the correlation ID of the current async/thread context.

    Args:
        log_level: Minimum log level (DEBUG, INFO, WARNING, ERROR, CRITICAL).
        log_dir: Directory for log files. When *None* no file sink is added.
        rotation: File-rotation policy accepted by loguru (e.g. ``"100 MB"``).
        retention: How long old log files are kept (e.g. ``"30 days"``).
        compression: Compression format for rotated files (``"gz"`` or ``"zip"``).
        serialize: When *True* each line is emitted as a JSON object.
    """
    _logger.remove()

    fmt = (
        "{time:YYYY-MM-DD HH:mm:ss.SSS} | "
        "{level: <8} | "
        "{name}:{function}:{line} | "
        "{extra[correlation_id]} - "
        "{message}"
    )

    # Options shared by both sinks.
    common: dict[str, Any] = {
        "level": log_level,
        "format": fmt,
        "filter": _correlation_filter,
        "backtrace": True,
        "serialize": serialize,
    }

    _logger.add(sys.stderr, colorize=True, diagnose=True, **common)

    if not log_dir:
        return

    log_path = Path(log_dir)
    log_path.mkdir(parents=True, exist_ok=True)
    _logger.add(
        log_path / "trading_{time:YYYY-MM-DD}.log",
        rotation=rotation,
        retention=retention,
        compression=compression,
        diagnose=False,
        enqueue=True,  # thread-safe async logging
        **common,
    )


def set_correlation_id(correlation_id: str) -> None:
    """Set the correlation ID for the current execution context.

    Args:
        correlation_id: Unique identifier to attach to all subsequent log
            lines emitted from the current async task or thread.
    """
    _correlation_id.set(correlation_id)


def get_logger(name: str, **context: Any):
    """Return a context-bound logger for a specific module.

    Args:
        name: Logger name, typically ``__name__`` of the calling module.
        **context: Arbitrary key-value pairs bound to every record from this
            logger instance (e.g. ``service="order-manager"``).

    Returns:
        A loguru logger with the supplied context pre-bound.

    Example::

        log = get_logger(__name__, service="risk-engine")
        log.info("position evaluated", symbol="BTCUSDT", pnl=1234.56)
    """
    return _logger.bind(module=name, **context)


# Apply default configuration so the module is usable without explicit setup.
configure_logger()

# Public re-export for convenience.
log = _logger
F = TypeVar("F", bound=Callable[..., Any])


def retry(
    *,
    attempts: int = 3,
    delay: float = 1.0,
    backoff: float = 2.0,
    exceptions: tuple[type[Exception], ...] = (Exception,),
    on_retry: Callable[[int, Exception], None] | None = None,
) -> Callable[[F], F]:
    """Decorator that retries a sync or async callable on failure.

    Uses exponential back-off between attempts.

    Args:
        attempts: Maximum number of total call attempts (including the first).
        delay: Initial delay in seconds before the first retry.
        backoff: Multiplicative factor applied to *delay* after each failure.
        exceptions: Tuple of exception types that trigger a retry.
        on_retry: Optional callback invoked with ``(attempt, exception)``
            before each retry sleep.

    Returns:
        A decorator that wraps sync or async functions.

    Raises:
        ValueError: If *attempts* is less than 1.

    Example::

        @retry(attempts=5, delay=0.5, exceptions=(IOError,))
        async def fetch_price(symbol: str) -> float:
            ...
    """
    if attempts < 1:
        # With attempts < 1 the retry loop below would never run and the
        # wrapper would end with `raise None` (a confusing TypeError).
        # Fail loudly at decoration time instead.
        raise ValueError(f"attempts must be >= 1, got {attempts}")

    def decorator(func: F) -> F:
        if asyncio.iscoroutinefunction(func):

            @functools.wraps(func)
            async def async_wrapper(*args: Any, **kwargs: Any) -> Any:
                current_delay = delay
                last_exc: Exception | None = None
                for attempt in range(1, attempts + 1):
                    try:
                        return await func(*args, **kwargs)
                    except exceptions as exc:
                        last_exc = exc
                        if attempt == attempts:
                            break
                        if on_retry:
                            on_retry(attempt, exc)
                        await asyncio.sleep(current_delay)
                        current_delay *= backoff
                # last_exc is always set: the loop ran at least once
                # (attempts >= 1) and only breaks after an exception.
                raise last_exc  # type: ignore[misc]

            return async_wrapper  # type: ignore[return-value]

        @functools.wraps(func)
        def sync_wrapper(*args: Any, **kwargs: Any) -> Any:
            current_delay = delay
            last_exc: Exception | None = None
            for attempt in range(1, attempts + 1):
                try:
                    return func(*args, **kwargs)
                except exceptions as exc:
                    last_exc = exc
                    if attempt == attempts:
                        break
                    if on_retry:
                        on_retry(attempt, exc)
                    time.sleep(current_delay)
                    current_delay *= backoff
            raise last_exc  # type: ignore[misc]

        return sync_wrapper  # type: ignore[return-value]

    return decorator  # type: ignore[return-value]
+ """ + + def __init__(self, rate: float, capacity: float | None = None) -> None: + if rate <= 0: + raise ValueError("rate must be positive") + self._rate = rate + self._capacity = capacity if capacity is not None else rate + self._tokens: float = self._capacity + self._last_refill: float = time.monotonic() + self._lock = asyncio.Lock() + + def _refill(self) -> None: + """Add tokens proportional to elapsed time.""" + now = time.monotonic() + elapsed = now - self._last_refill + self._tokens = min( + self._capacity, self._tokens + elapsed * self._rate + ) + self._last_refill = now + + async def acquire(self, tokens: float = 1.0) -> None: + """Wait until *tokens* are available, then consume them. + + Args: + tokens: Number of tokens to consume (default 1). + + Raises: + ValueError: If *tokens* exceeds bucket capacity. + """ + if tokens > self._capacity: + raise ValueError( + f"Requested {tokens} tokens exceeds capacity {self._capacity}" + ) + async with self._lock: + while True: + self._refill() + if self._tokens >= tokens: + self._tokens -= tokens + return + wait = (tokens - self._tokens) / self._rate + await asyncio.sleep(wait) + + +# --------------------------------------------------------------------------- +# Timer +# --------------------------------------------------------------------------- + + +class Timer: + """Context-manager and decorator stopwatch. + + Args: + name: Optional label included in the string representation. + + Example:: + + with Timer("order-routing") as t: + await route_order(order) + print(t.elapsed_ms) # 42.1 + + @Timer("inference") + async def run_model(data): + ... 
+ """ + + def __init__(self, name: str = "") -> None: + self.name = name + self._start: float = 0.0 + self._end: float = 0.0 + + # --- Context-manager protocol --- + + def __enter__(self) -> "Timer": + self._start = time.perf_counter() + return self + + def __exit__(self, *_: Any) -> None: + self._end = time.perf_counter() + + # --- Async context-manager protocol --- + + async def __aenter__(self) -> "Timer": + self._start = time.perf_counter() + return self + + async def __aexit__(self, *_: Any) -> None: + self._end = time.perf_counter() + + # --- Decorator protocol --- + + @overload + def __call__(self, func: Callable[..., Coroutine[Any, Any, Any]]) -> Callable[..., Coroutine[Any, Any, Any]]: ... + + @overload + def __call__(self, func: Callable[..., Any]) -> Callable[..., Any]: ... + + def __call__(self, func: Any) -> Any: # noqa: D102 + if asyncio.iscoroutinefunction(func): + + @functools.wraps(func) + async def async_wrapper(*args: Any, **kwargs: Any) -> Any: + async with self: + return await func(*args, **kwargs) + + return async_wrapper + + @functools.wraps(func) + def sync_wrapper(*args: Any, **kwargs: Any) -> Any: + with self: + return func(*args, **kwargs) + + return sync_wrapper + + # --- Properties --- + + @property + def elapsed(self) -> float: + """Elapsed time in seconds.""" + end = self._end or time.perf_counter() + return end - self._start + + @property + def elapsed_ms(self) -> float: + """Elapsed time in milliseconds.""" + return self.elapsed * 1_000.0 + + def __str__(self) -> str: # noqa: D105 + label = f"[{self.name}] " if self.name else "" + return f"{label}{self.elapsed_ms:.3f} ms" + + def __repr__(self) -> str: # noqa: D105 + return f"Timer(name={self.name!r}, elapsed_ms={self.elapsed_ms:.3f})" + + +# --------------------------------------------------------------------------- +# Timestamp helpers +# --------------------------------------------------------------------------- + + +def utc_now() -> datetime: + """Return the current UTC datetime 
def to_unix_ms(dt: datetime) -> int:
    """Convert *dt* to milliseconds since the Unix epoch.

    Args:
        dt: Timezone-aware or naive datetime; naive values are read as UTC.

    Returns:
        Integer milliseconds since 1970-01-01T00:00:00Z.
    """
    aware = dt if dt.tzinfo is not None else dt.replace(tzinfo=timezone.utc)
    return int(aware.timestamp() * 1_000)


def from_unix_ms(ts_ms: int) -> datetime:
    """Convert a Unix millisecond timestamp to an aware UTC datetime.

    Args:
        ts_ms: Milliseconds since the Unix epoch.

    Returns:
        Timezone-aware :class:`datetime` in UTC.
    """
    return datetime.fromtimestamp(ts_ms / 1_000.0, tz=timezone.utc)


# ---------------------------------------------------------------------------
# Dict utilities
# ---------------------------------------------------------------------------


def deep_merge(base: dict[str, Any], override: dict[str, Any]) -> dict[str, Any]:
    """Recursively merge *override* into a copy of *base*.

    Nested dicts are merged key-by-key; any other value in *override*
    replaces the corresponding value in *base*.

    Args:
        base: The base dictionary.
        override: Values that overwrite *base*.

    Returns:
        New merged dictionary (neither input is mutated).
    """
    merged = {**base}
    for key, incoming in override.items():
        both_dicts = (
            key in merged
            and isinstance(merged[key], dict)
            and isinstance(incoming, dict)
        )
        merged[key] = deep_merge(merged[key], incoming) if both_dicts else incoming
    return merged
def safe_get(data: dict[str, Any], *keys: str, default: Any = None) -> Any:
    """Safely traverse a nested dict along a sequence of keys.

    Args:
        data: The dictionary to traverse.
        *keys: Ordered key path to follow.
        default: Value returned as soon as the path breaks off.

    Returns:
        The value at the end of the path, or *default*.

    Example::

        safe_get(cfg, "exchange", "api_key", default="")
    """
    node: Any = data
    for step in keys:
        if not isinstance(node, dict):
            return default
        node = node.get(step, default)
        if node is default:
            return default
    return node
class SignalDirection(str, Enum):
    """Directional bias of a trading signal."""

    LONG = "LONG"
    SHORT = "SHORT"
    NEUTRAL = "NEUTRAL"
    EXIT_LONG = "EXIT_LONG"
    EXIT_SHORT = "EXIT_SHORT"


class SignalStrength(str, Enum):
    """Qualitative confidence band for a signal."""

    VERY_WEAK = "VERY_WEAK"
    WEAK = "WEAK"
    MODERATE = "MODERATE"
    STRONG = "STRONG"
    VERY_STRONG = "VERY_STRONG"

    @classmethod
    def from_confidence(cls, confidence: float) -> "SignalStrength":
        """Bucket a [0, 1] confidence score into a strength band.

        Args:
            confidence: Normalised confidence value in [0, 1].

        Returns:
            The band whose interval contains *confidence*.

        Raises:
            ValueError: If *confidence* is outside [0, 1].
        """
        if not 0.0 <= confidence <= 1.0:
            raise ValueError(f"confidence must be in [0, 1], got {confidence}")
        # Bands are half-open: [0, .2), [.2, .4), [.4, .6), [.6, .8), [.8, 1].
        bands = (
            (0.2, cls.VERY_WEAK),
            (0.4, cls.WEAK),
            (0.6, cls.MODERATE),
            (0.8, cls.STRONG),
        )
        for upper, band in bands:
            if confidence < upper:
                return band
        return cls.VERY_STRONG


class DecisionAction(str, Enum):
    """Action the AGI orchestrator has decided to take."""

    OPEN_LONG = "OPEN_LONG"
    OPEN_SHORT = "OPEN_SHORT"
    CLOSE_LONG = "CLOSE_LONG"
    CLOSE_SHORT = "CLOSE_SHORT"
    REDUCE_LONG = "REDUCE_LONG"
    REDUCE_SHORT = "REDUCE_SHORT"
    HOLD = "HOLD"
    HALT = "HALT"  # Emergency halt – close all positions.
class _BaseAIModel(BaseModel):
    """Shared pydantic configuration for every AI-layer model."""

    model_config = ConfigDict(
        populate_by_name=True,
        use_enum_values=False,
        # NOTE(review): json_encoders is deprecated in pydantic v2; kept
        # as-is to preserve the current serialisation behaviour.
        json_encoders={Decimal: str, datetime: lambda v: v.isoformat()},
    )


class TradingSignal(_BaseAIModel):
    """A directional trading signal produced by one strategy or model.

    Carries the direction and normalised confidence plus optional price
    levels (target / stop / take-profit), a forecast horizon, and
    provenance data (``model_id``, ``features``) for traceability.
    When *strength* is omitted it is derived from *confidence* after
    validation.
    """

    signal_id: str = Field(default_factory=lambda: str(uuid.uuid4()))
    symbol: str = Field(..., min_length=1)
    direction: SignalDirection
    confidence: float = Field(..., ge=0.0, le=1.0)
    strength: SignalStrength | None = None
    price_target: Decimal | None = Field(None, gt=Decimal("0"))
    stop_loss: Decimal | None = Field(None, gt=Decimal("0"))
    take_profit: Decimal | None = Field(None, gt=Decimal("0"))
    horizon_seconds: int = Field(3600, ge=1)
    model_id: str = Field("unknown")
    features: dict[str, Any] = Field(default_factory=dict)
    timestamp: datetime = Field(
        default_factory=lambda: datetime.now(tz=timezone.utc)
    )
    expires_at: datetime | None = None

    @model_validator(mode="after")
    def _derive_strength(self) -> "TradingSignal":
        """Fill *strength* from *confidence* when the caller omitted it."""
        if self.strength is not None:
            return self
        derived = SignalStrength.from_confidence(self.confidence)
        # object.__setattr__ sidesteps pydantic's assignment machinery.
        object.__setattr__(self, "strength", derived)
        return self

    @property
    def is_expired(self) -> bool:
        """Whether the signal has passed its optional expiry timestamp."""
        expiry = self.expires_at
        return expiry is not None and datetime.now(tz=timezone.utc) > expiry

    @property
    def risk_reward_ratio(self) -> Decimal | None:
        """Reward/risk ratio around *price_target*.

        Returns *None* unless price_target, stop_loss and take_profit are
        all set, or when the risk leg is zero (target equals stop).
        """
        if (
            self.price_target is None
            or self.stop_loss is None
            or self.take_profit is None
        ):
            return None
        risk_leg = abs(self.price_target - self.stop_loss)
        if risk_leg == Decimal("0"):
            return None
        reward_leg = abs(self.take_profit - self.price_target)
        return reward_leg / risk_leg
+ ) + confidence: float = Field(..., ge=0.0, le=1.0) + raw_output: dict[str, Any] = Field(default_factory=dict) + feature_importance: dict[str, float] = Field(default_factory=dict) + latency_ms: float = Field(0.0, ge=0.0) + timestamp: datetime = Field( + default_factory=lambda: datetime.now(tz=timezone.utc) + ) + horizon_seconds: int = Field(3600, ge=1) + + @field_validator("feature_importance") + @classmethod + def _validate_importance_values( + cls, v: dict[str, float] + ) -> dict[str, float]: + """Ensure all importance scores are non-negative.""" + for name, score in v.items(): + if score < 0: + raise ValueError( + f"Feature importance for {name!r} must be >= 0, got {score}" + ) + return v + + @property + def direction(self) -> SignalDirection: + """Implied directional signal from the predicted return.""" + if self.predicted_return > 0: + return SignalDirection.LONG + if self.predicted_return < 0: + return SignalDirection.SHORT + return SignalDirection.NEUTRAL + + +# --------------------------------------------------------------------------- +# RiskAssessment +# --------------------------------------------------------------------------- + + +class RiskAssessment(_BaseAIModel): + """Risk evaluation for a proposed trade or portfolio state. + + Args: + assessment_id: Unique assessment identifier. + symbol: Instrument being assessed. + proposed_quantity: Trade size being evaluated. + proposed_notional_usd: Estimated USD notional value. + current_drawdown_pct: Portfolio drawdown at time of assessment. + position_concentration_pct: Concentration of the symbol in the portfolio. + var_1d_pct: 1-day Value-at-Risk as a percentage of portfolio equity. + sharpe_estimate: Estimated Sharpe ratio for the proposed trade. + is_approved: Whether the risk gate approved the trade. + rejection_reasons: Human-readable reasons when *is_approved* is False. + risk_score: Composite risk score in [0, 1] (higher = riskier). + timestamp: Assessment timestamp (UTC-aware). 
+ """ + + assessment_id: str = Field(default_factory=lambda: str(uuid.uuid4())) + symbol: str = Field(..., min_length=1) + proposed_quantity: Decimal = Field(..., gt=Decimal("0")) + proposed_notional_usd: Decimal = Field(..., ge=Decimal("0")) + current_drawdown_pct: float = Field(0.0, ge=0.0, le=100.0) + position_concentration_pct: float = Field(0.0, ge=0.0, le=100.0) + var_1d_pct: float = Field(0.0, ge=0.0) + sharpe_estimate: float | None = None + is_approved: bool = True + rejection_reasons: list[str] = Field(default_factory=list) + risk_score: float = Field(0.0, ge=0.0, le=1.0) + timestamp: datetime = Field( + default_factory=lambda: datetime.now(tz=timezone.utc) + ) + + @model_validator(mode="after") + def _sync_approval(self) -> "RiskAssessment": + """Mark as rejected when rejection reasons are present.""" + if self.rejection_reasons and self.is_approved: + object.__setattr__(self, "is_approved", False) + return self + + +# --------------------------------------------------------------------------- +# AGIDecision +# --------------------------------------------------------------------------- + + +class AGIDecision(_BaseAIModel): + """Final decision produced by the AGI orchestration layer. + + Aggregates signals, model predictions, and risk assessment into a single + actionable decision that can be forwarded to the execution engine. + + Args: + decision_id: Unique decision identifier. + symbol: Instrument the decision applies to. + action: The action the AGI has decided to take. + confidence: Aggregate decision confidence in [0, 1]. + suggested_quantity: Suggested order quantity (None for HOLD/HALT). + suggested_price: Optional limit-price recommendation. + signals: Input signals that contributed to this decision. + predictions: Model predictions considered by the AGI. + risk_assessment: Risk gate evaluation for this decision. + reasoning: Human-readable explanation of the decision. + metadata: Arbitrary extra fields for traceability. 
class AGIDecision(_BaseAIModel):
    """Final decision emitted by the AGI orchestration layer.

    Bundles the contributing signals and model predictions, the risk-gate
    verdict, and the chosen action into one record that can be handed to
    the execution engine and audited afterwards.
    """

    decision_id: str = Field(default_factory=lambda: str(uuid.uuid4()))
    symbol: str = Field(..., min_length=1)
    action: DecisionAction
    confidence: float = Field(..., ge=0.0, le=1.0)
    suggested_quantity: Decimal | None = Field(None, gt=Decimal("0"))
    suggested_price: Decimal | None = Field(None, gt=Decimal("0"))
    signals: list[TradingSignal] = Field(default_factory=list)
    predictions: list[ModelPrediction] = Field(default_factory=list)
    risk_assessment: RiskAssessment | None = None
    reasoning: str = ""
    metadata: dict[str, Any] = Field(default_factory=dict)
    timestamp: datetime = Field(
        default_factory=lambda: datetime.now(tz=timezone.utc)
    )
    executed: bool = False
    execution_order_id: str | None = None

    @property
    def is_actionable(self) -> bool:
        """Whether this decision should result in an order submission.

        Requires a non-HOLD/HALT action, a suggested quantity, and —
        when a risk assessment is attached — an approved one.
        """
        if self.action in {DecisionAction.HOLD, DecisionAction.HALT}:
            return False
        if self.suggested_quantity is None:
            return False
        gate = self.risk_assessment
        return gate is None or gate.is_approved

    @property
    def average_signal_confidence(self) -> float:
        """Mean confidence over the contributing signals (0.0 if none)."""
        if not self.signals:
            return 0.0
        total = sum(signal.confidence for signal in self.signals)
        return total / len(self.signals)

    def mark_executed(self, order_id: str) -> "AGIDecision":
        """Return an immutable copy flagged as executed.

        Args:
            order_id: Order ID assigned by the execution engine.

        Returns:
            New :class:`AGIDecision` with *executed* set and the order ID
            recorded; the original instance is left untouched.
        """
        return self.model_copy(
            update={"executed": True, "execution_order_id": order_id}
        )


# --- shared/models/market_data.py preamble -------------------------------

PositiveDecimal = Annotated[Decimal, Field(gt=Decimal("0"))]
NonNegativeDecimal = Annotated[Decimal, Field(ge=Decimal("0"))]


class _BaseMarketModel(BaseModel):
    """Shared configuration for all market-data models.

    Instances are frozen (immutable) so snapshots cannot be mutated after
    capture.
    """

    model_config = ConfigDict(
        frozen=True,  # immutable after creation
        populate_by_name=True,
        use_enum_values=True,
        # NOTE(review): json_encoders is deprecated in pydantic v2; kept
        # as-is to preserve the current serialisation behaviour.
        json_encoders={Decimal: str, datetime: lambda v: v.isoformat()},
    )
+ interval: Bar duration string (e.g. ``"1m"``, ``"1h"``). + """ + + symbol: str = Field(..., min_length=1, description="Trading pair symbol.") + open_time: datetime = Field(..., description="Bar open timestamp (UTC).") + close_time: datetime = Field(..., description="Bar close timestamp (UTC).") + open: PositiveDecimal = Field(..., description="Opening price.") + high: PositiveDecimal = Field(..., description="Highest price.") + low: PositiveDecimal = Field(..., description="Lowest price.") + close: PositiveDecimal = Field(..., description="Closing price.") + volume: NonNegativeDecimal = Field(..., description="Base-asset volume.") + quote_volume: NonNegativeDecimal = Field( + Decimal("0"), description="Quote-asset volume." + ) + trades: int = Field(0, ge=0, description="Number of trades in the bar.") + interval: str = Field("1m", description="Bar interval string.") + + @model_validator(mode="after") + def _validate_hl(self) -> "OHLCV": + """Ensure high >= low and both bound open/close.""" + if self.high < self.low: + raise ValueError(f"high ({self.high}) must be >= low ({self.low})") + if self.high < max(self.open, self.close): + raise ValueError("high must be >= max(open, close)") + if self.low > min(self.open, self.close): + raise ValueError("low must be <= min(open, close)") + return self + + @field_validator("open_time", "close_time", mode="before") + @classmethod + def _ensure_utc(cls, v: datetime) -> datetime: + """Attach UTC timezone if the datetime is naive.""" + if isinstance(v, datetime) and v.tzinfo is None: + return v.replace(tzinfo=timezone.utc) + return v + + @property + def midpoint(self) -> Decimal: + """Mid-price of high and low.""" + return (self.high + self.low) / Decimal("2") + + @property + def range(self) -> Decimal: + """Price range of the bar (high − low).""" + return self.high - self.low + + +# --------------------------------------------------------------------------- +# Ticker +# 
--------------------------------------------------------------------------- + + +class Ticker(_BaseMarketModel): + """Best bid/ask snapshot for an instrument. + + Args: + symbol: Instrument symbol. + bid: Best bid price. + ask: Best ask price. + bid_qty: Quantity available at the best bid. + ask_qty: Quantity available at the best ask. + last: Last traded price. + last_qty: Quantity of the last trade. + timestamp: Time of the snapshot (UTC-aware). + """ + + symbol: str = Field(..., min_length=1) + bid: PositiveDecimal + ask: PositiveDecimal + bid_qty: NonNegativeDecimal = Decimal("0") + ask_qty: NonNegativeDecimal = Decimal("0") + last: PositiveDecimal | None = None + last_qty: NonNegativeDecimal | None = None + timestamp: datetime = Field( + default_factory=lambda: datetime.now(tz=timezone.utc) + ) + + @model_validator(mode="after") + def _validate_spread(self) -> "Ticker": + """Ensure ask >= bid (non-negative spread).""" + if self.ask < self.bid: + raise ValueError( + f"ask ({self.ask}) must be >= bid ({self.bid})" + ) + return self + + @property + def spread(self) -> Decimal: + """Absolute bid-ask spread.""" + return self.ask - self.bid + + @property + def mid_price(self) -> Decimal: + """Mid-price between best bid and ask.""" + return (self.bid + self.ask) / Decimal("2") + + +# --------------------------------------------------------------------------- +# Order Book +# --------------------------------------------------------------------------- + + +class OrderBookLevel(_BaseMarketModel): + """A single price-level in the order book. + + Args: + price: Price of the level. + quantity: Total quantity resting at this price. + """ + + price: PositiveDecimal + quantity: NonNegativeDecimal + + +class OrderBook(_BaseMarketModel): + """Full order-book depth snapshot. + + Args: + symbol: Instrument symbol. + bids: List of bid levels ordered best-to-worst (descending price). + asks: List of ask levels ordered best-to-worst (ascending price). 
+ timestamp: Snapshot capture time (UTC-aware). + last_update_id: Exchange sequence number for this snapshot. + """ + + symbol: str = Field(..., min_length=1) + bids: list[OrderBookLevel] = Field(default_factory=list) + asks: list[OrderBookLevel] = Field(default_factory=list) + timestamp: datetime = Field( + default_factory=lambda: datetime.now(tz=timezone.utc) + ) + last_update_id: int | None = None + + @property + def best_bid(self) -> OrderBookLevel | None: + """Best (highest) bid level, or *None* if empty.""" + return self.bids[0] if self.bids else None + + @property + def best_ask(self) -> OrderBookLevel | None: + """Best (lowest) ask level, or *None* if empty.""" + return self.asks[0] if self.asks else None + + @property + def mid_price(self) -> Decimal | None: + """Mid-price, or *None* if either side is empty.""" + if self.best_bid and self.best_ask: + return (self.best_bid.price + self.best_ask.price) / Decimal("2") + return None + + def bid_liquidity(self, depth: int = 5) -> Decimal: + """Total quantity available in the top *depth* bid levels. + + Args: + depth: Number of levels to sum. + + Returns: + Total bid quantity. + """ + return sum( + (lvl.quantity for lvl in self.bids[:depth]), start=Decimal("0") + ) + + def ask_liquidity(self, depth: int = 5) -> Decimal: + """Total quantity available in the top *depth* ask levels. + + Args: + depth: Number of levels to sum. + + Returns: + Total ask quantity. + """ + return sum( + (lvl.quantity for lvl in self.asks[:depth]), start=Decimal("0") + ) + + +# --------------------------------------------------------------------------- +# Trade +# --------------------------------------------------------------------------- + + +class Trade(_BaseMarketModel): + """Single executed trade (tape print). + + Args: + trade_id: Exchange-assigned trade identifier. + symbol: Instrument symbol. + price: Execution price. + quantity: Executed quantity. + is_buyer_maker: ``True`` when the buy side is the passive (maker) side. 
+ timestamp: Trade execution time (UTC-aware). + buyer_order_id: Optional buy-side order ID. + seller_order_id: Optional sell-side order ID. + """ + + trade_id: str = Field(..., min_length=1) + symbol: str = Field(..., min_length=1) + price: PositiveDecimal + quantity: PositiveDecimal + is_buyer_maker: bool = False + timestamp: datetime = Field( + default_factory=lambda: datetime.now(tz=timezone.utc) + ) + buyer_order_id: str | None = None + seller_order_id: str | None = None + + @property + def notional(self) -> Decimal: + """Trade notional value (price × quantity).""" + return self.price * self.quantity + + +# --------------------------------------------------------------------------- +# Market Snapshot +# --------------------------------------------------------------------------- + + +class MarketSnapshot(_BaseMarketModel): + """Composite market snapshot combining ticker, book, and recent trades. + + Args: + symbol: Instrument symbol. + ticker: Current ticker snapshot. + order_book: Current order-book depth. + recent_trades: Latest trade prints (oldest first). + latest_candle: Most recently closed OHLCV bar. + timestamp: Snapshot assembly time (UTC-aware). + """ + + symbol: str = Field(..., min_length=1) + ticker: Ticker | None = None + order_book: OrderBook | None = None + recent_trades: list[Trade] = Field(default_factory=list) + latest_candle: OHLCV | None = None + timestamp: datetime = Field( + default_factory=lambda: datetime.now(tz=timezone.utc) + ) + + @property + def is_complete(self) -> bool: + """``True`` when all four data components are present.""" + return all( + [self.ticker, self.order_book, self.recent_trades, self.latest_candle] + ) diff --git a/shared/models/trading_models.py b/shared/models/trading_models.py new file mode 100644 index 0000000..1bf1536 --- /dev/null +++ b/shared/models/trading_models.py @@ -0,0 +1,400 @@ +"""Pydantic models for trading operations. + +Provides: + +* :class:`Side` – BUY / SELL enum. 
+* :class:`OrderType` – MARKET, LIMIT, STOP, etc. +* :class:`OrderStatus` – full order lifecycle states. +* :class:`TimeInForce` – GTC, IOC, FOK, GTD. +* :class:`Order` – order request and state model. +* :class:`Fill` – individual execution / trade fill. +* :class:`Position` – open position for one instrument. +* :class:`Portfolio` – aggregate portfolio view. +""" + +from __future__ import annotations + +import uuid +from datetime import datetime, timezone +from decimal import Decimal +from enum import Enum +from typing import Annotated + +from pydantic import BaseModel, ConfigDict, Field, model_validator + + +PositiveDecimal = Annotated[Decimal, Field(gt=Decimal("0"))] +NonNegativeDecimal = Annotated[Decimal, Field(ge=Decimal("0"))] + + +# --------------------------------------------------------------------------- +# Enumerations +# --------------------------------------------------------------------------- + + +class Side(str, Enum): + """Order side.""" + + BUY = "BUY" + SELL = "SELL" + + @property + def opposite(self) -> "Side": + """Return the opposite side.""" + return Side.SELL if self is Side.BUY else Side.BUY + + +class OrderType(str, Enum): + """Order execution type.""" + + MARKET = "MARKET" + LIMIT = "LIMIT" + STOP_MARKET = "STOP_MARKET" + STOP_LIMIT = "STOP_LIMIT" + TAKE_PROFIT = "TAKE_PROFIT" + TAKE_PROFIT_LIMIT = "TAKE_PROFIT_LIMIT" + TRAILING_STOP = "TRAILING_STOP" + + +class OrderStatus(str, Enum): + """Order lifecycle state.""" + + PENDING = "PENDING" # Created locally, not yet sent to exchange. + SUBMITTED = "SUBMITTED" # Sent to exchange, awaiting acknowledgement. + ACCEPTED = "ACCEPTED" # Acknowledged by exchange. 
+ PARTIALLY_FILLED = "PARTIALLY_FILLED" + FILLED = "FILLED" + CANCELLED = "CANCELLED" + REJECTED = "REJECTED" + EXPIRED = "EXPIRED" + + @property + def is_terminal(self) -> bool: + """``True`` for states that cannot transition further.""" + return self in { + OrderStatus.FILLED, + OrderStatus.CANCELLED, + OrderStatus.REJECTED, + OrderStatus.EXPIRED, + } + + @property + def is_active(self) -> bool: + """``True`` when the order is alive on the exchange.""" + return self in { + OrderStatus.SUBMITTED, + OrderStatus.ACCEPTED, + OrderStatus.PARTIALLY_FILLED, + } + + +class TimeInForce(str, Enum): + """Order time-in-force policy.""" + + GTC = "GTC" # Good Till Cancelled + IOC = "IOC" # Immediate Or Cancel + FOK = "FOK" # Fill Or Kill + GTD = "GTD" # Good Till Date + + +# --------------------------------------------------------------------------- +# Shared config +# --------------------------------------------------------------------------- + + +class _BaseTradeModel(BaseModel): + model_config = ConfigDict( + populate_by_name=True, + use_enum_values=False, + json_encoders={Decimal: str, datetime: lambda v: v.isoformat()}, + ) + + +# --------------------------------------------------------------------------- +# Fill +# --------------------------------------------------------------------------- + + +class Fill(_BaseTradeModel): + """A single execution / trade fill for an order. + + Args: + fill_id: Unique fill identifier. + order_id: Parent order identifier. + symbol: Instrument symbol. + side: Execution side. + price: Fill execution price. + quantity: Fill executed quantity. + commission: Commission charged for this fill. + commission_asset: Asset used to pay the commission. + timestamp: Fill timestamp (UTC-aware). + trade_id: Exchange trade identifier. 
+ """ + + fill_id: str = Field(default_factory=lambda: str(uuid.uuid4())) + order_id: str = Field(..., min_length=1) + symbol: str = Field(..., min_length=1) + side: Side + price: PositiveDecimal + quantity: PositiveDecimal + commission: NonNegativeDecimal = Decimal("0") + commission_asset: str = "USDT" + timestamp: datetime = Field( + default_factory=lambda: datetime.now(tz=timezone.utc) + ) + trade_id: str | None = None + + @property + def notional(self) -> Decimal: + """Fill notional value (price × quantity).""" + return self.price * self.quantity + + +# --------------------------------------------------------------------------- +# Order +# --------------------------------------------------------------------------- + + +class Order(_BaseTradeModel): + """Represents a trading order through its full lifecycle. + + Args: + order_id: Client-generated unique order ID. + exchange_order_id: Exchange-assigned order ID (set after acceptance). + symbol: Instrument symbol. + side: BUY or SELL. + order_type: Execution type. + quantity: Requested quantity. + price: Limit price (required for LIMIT / STOP_LIMIT orders). + stop_price: Stop trigger price. + time_in_force: Order duration policy. + status: Current order lifecycle state. + filled_quantity: Cumulative executed quantity. + average_fill_price: Volume-weighted average fill price. + fills: List of individual fills. + created_at: Order creation timestamp. + updated_at: Last state-change timestamp. + strategy_id: Identifier of the strategy that placed this order. + tags: Arbitrary metadata tags. 
+ """ + + order_id: str = Field(default_factory=lambda: str(uuid.uuid4())) + exchange_order_id: str | None = None + symbol: str = Field(..., min_length=1) + side: Side + order_type: OrderType + quantity: PositiveDecimal + price: PositiveDecimal | None = None + stop_price: PositiveDecimal | None = None + time_in_force: TimeInForce = TimeInForce.GTC + status: OrderStatus = OrderStatus.PENDING + filled_quantity: NonNegativeDecimal = Decimal("0") + average_fill_price: NonNegativeDecimal | None = None + fills: list[Fill] = Field(default_factory=list) + created_at: datetime = Field( + default_factory=lambda: datetime.now(tz=timezone.utc) + ) + updated_at: datetime = Field( + default_factory=lambda: datetime.now(tz=timezone.utc) + ) + strategy_id: str | None = None + tags: dict[str, str] = Field(default_factory=dict) + + @model_validator(mode="after") + def _validate_price_requirements(self) -> "Order": + """Ensure limit/stop orders carry the appropriate price fields.""" + if self.order_type in {OrderType.LIMIT, OrderType.STOP_LIMIT}: + if self.price is None: + raise ValueError( + f"{self.order_type.value} orders require a limit price." + ) + if self.order_type in { + OrderType.STOP_MARKET, + OrderType.STOP_LIMIT, + OrderType.TAKE_PROFIT, + OrderType.TAKE_PROFIT_LIMIT, + }: + if self.stop_price is None: + raise ValueError( + f"{self.order_type.value} orders require a stop_price." + ) + return self + + @property + def remaining_quantity(self) -> Decimal: + """Quantity not yet filled.""" + return self.quantity - self.filled_quantity + + @property + def fill_ratio(self) -> Decimal: + """Proportion of the order that has been filled (0–1).""" + return self.filled_quantity / self.quantity + + @property + def is_complete(self) -> bool: + """``True`` when the order is in a terminal state.""" + return self.status.is_terminal + + def apply_fill(self, fill: Fill) -> "Order": + """Return a new Order with the fill applied. + + Args: + fill: The fill to apply. 
+ + Returns: + A new immutable Order instance with updated fill state. + + Raises: + ValueError: If the fill would exceed the order quantity. + """ + new_filled = self.filled_quantity + fill.quantity + if new_filled > self.quantity: + raise ValueError( + f"Fill quantity {fill.quantity} would exceed order quantity " + f"{self.quantity} (already filled: {self.filled_quantity})" + ) + + # Compute new VWAP + if self.average_fill_price and self.filled_quantity > 0: + total_notional = ( + self.average_fill_price * self.filled_quantity + + fill.price * fill.quantity + ) + new_vwap = total_notional / new_filled + else: + new_vwap = fill.price + + new_status = ( + OrderStatus.FILLED + if new_filled == self.quantity + else OrderStatus.PARTIALLY_FILLED + ) + + return self.model_copy( + update={ + "fills": [*self.fills, fill], + "filled_quantity": new_filled, + "average_fill_price": new_vwap, + "status": new_status, + "updated_at": datetime.now(tz=timezone.utc), + } + ) + + +# --------------------------------------------------------------------------- +# Position +# --------------------------------------------------------------------------- + + +class Position(_BaseTradeModel): + """Open position in a single instrument. + + Args: + symbol: Instrument symbol. + side: Net position side (BUY = long, SELL = short). + quantity: Absolute open quantity. + average_entry_price: Volume-weighted average entry price. + unrealised_pnl: Mark-to-market unrealised P&L. + realised_pnl: Realised P&L from closed sub-positions. + notional: Current mark-to-market notional value. + opened_at: Position open timestamp. + updated_at: Last update timestamp. + strategy_id: Identifier of the owning strategy. 
+ """ + + symbol: str = Field(..., min_length=1) + side: Side + quantity: PositiveDecimal + average_entry_price: PositiveDecimal + unrealised_pnl: Decimal = Decimal("0") + realised_pnl: Decimal = Decimal("0") + notional: NonNegativeDecimal = Decimal("0") + opened_at: datetime = Field( + default_factory=lambda: datetime.now(tz=timezone.utc) + ) + updated_at: datetime = Field( + default_factory=lambda: datetime.now(tz=timezone.utc) + ) + strategy_id: str | None = None + + def mark_to_market(self, mark_price: Decimal) -> "Position": + """Return a new Position with unrealised P&L and notional updated. + + Args: + mark_price: Current market price used for marking. + + Returns: + Updated Position (immutable copy). + """ + notional = mark_price * self.quantity + sign = Decimal("1") if self.side is Side.BUY else Decimal("-1") + upnl = sign * (mark_price - self.average_entry_price) * self.quantity + return self.model_copy( + update={ + "unrealised_pnl": upnl, + "notional": notional, + "updated_at": datetime.now(tz=timezone.utc), + } + ) + + +# --------------------------------------------------------------------------- +# Portfolio +# --------------------------------------------------------------------------- + + +class Portfolio(_BaseTradeModel): + """Aggregate portfolio view across all open positions. + + Args: + portfolio_id: Unique portfolio identifier. + account_id: Owning account / sub-account identifier. + positions: Map of symbol → Position. + cash_balance: Available cash in quote currency. + total_equity: Total equity (cash + mark-to-market position values). + total_unrealised_pnl: Sum of unrealised P&L across all positions. + total_realised_pnl: Sum of realised P&L across all positions. + peak_equity: Highest recorded equity (used for drawdown calculation). + updated_at: Last update timestamp. 
+ """ + + portfolio_id: str = Field(default_factory=lambda: str(uuid.uuid4())) + account_id: str = Field(..., min_length=1) + positions: dict[str, Position] = Field(default_factory=dict) + cash_balance: NonNegativeDecimal = Decimal("0") + total_equity: NonNegativeDecimal = Decimal("0") + total_unrealised_pnl: Decimal = Decimal("0") + total_realised_pnl: Decimal = Decimal("0") + peak_equity: NonNegativeDecimal = Decimal("0") + updated_at: datetime = Field( + default_factory=lambda: datetime.now(tz=timezone.utc) + ) + + @property + def current_drawdown_pct(self) -> Decimal: + """Current drawdown from peak equity as a percentage. + + Returns: + Drawdown percentage (0 = at peak, 100 = total loss). + """ + if self.peak_equity == Decimal("0"): + return Decimal("0") + return ( + (self.peak_equity - self.total_equity) / self.peak_equity * Decimal("100") + ) + + @property + def open_symbol_count(self) -> int: + """Number of symbols with open positions.""" + return len(self.positions) + + def get_position(self, symbol: str) -> Position | None: + """Retrieve a position by symbol. + + Args: + symbol: Instrument symbol. + + Returns: + The position, or *None* if no open position exists. 
+ """ + return self.positions.get(symbol) diff --git a/shared/proto/agi.proto b/shared/proto/agi.proto new file mode 100644 index 0000000..50c0ee5 --- /dev/null +++ b/shared/proto/agi.proto @@ -0,0 +1,230 @@ +syntax = "proto3"; + +package agi; + +option go_package = "github.com/rag7/trading/proto/agi"; +option java_multiple_files = true; +option java_package = "com.rag7.trading.proto.agi"; + +import "google/protobuf/timestamp.proto"; +import "google/protobuf/struct.proto"; + +// --------------------------------------------------------------------------- +// Enumerations +// --------------------------------------------------------------------------- + +enum SignalDirection { + SIGNAL_DIRECTION_UNSPECIFIED = 0; + SIGNAL_DIRECTION_LONG = 1; + SIGNAL_DIRECTION_SHORT = 2; + SIGNAL_DIRECTION_NEUTRAL = 3; + SIGNAL_DIRECTION_EXIT_LONG = 4; + SIGNAL_DIRECTION_EXIT_SHORT = 5; +} + +enum SignalStrength { + SIGNAL_STRENGTH_UNSPECIFIED = 0; + SIGNAL_STRENGTH_VERY_WEAK = 1; + SIGNAL_STRENGTH_WEAK = 2; + SIGNAL_STRENGTH_MODERATE = 3; + SIGNAL_STRENGTH_STRONG = 4; + SIGNAL_STRENGTH_VERY_STRONG = 5; +} + +enum DecisionAction { + DECISION_ACTION_UNSPECIFIED = 0; + DECISION_ACTION_OPEN_LONG = 1; + DECISION_ACTION_OPEN_SHORT = 2; + DECISION_ACTION_CLOSE_LONG = 3; + DECISION_ACTION_CLOSE_SHORT = 4; + DECISION_ACTION_REDUCE_LONG = 5; + DECISION_ACTION_REDUCE_SHORT = 6; + DECISION_ACTION_HOLD = 7; + DECISION_ACTION_HALT = 8; +} + +// --------------------------------------------------------------------------- +// Core messages +// --------------------------------------------------------------------------- + +// Raw signal emitted by a strategy or sub-model. +message TradingSignal { + string signal_id = 1; + string symbol = 2; + SignalDirection direction = 3; + double confidence = 4; + SignalStrength strength = 5; + string price_target = 6; // String-encoded decimal. 
+  string stop_loss = 7;
+  string take_profit = 8;
+  int32 horizon_seconds = 9;
+  string model_id = 10;
+  // Arbitrary feature key-value pairs for traceability.
+  google.protobuf.Struct features = 11;
+  google.protobuf.Timestamp timestamp = 12;
+  google.protobuf.Timestamp expires_at = 13;
+}
+
+// Prediction output from a single ML model.
+message ModelPrediction {
+  string prediction_id = 1;
+  string model_id = 2;
+  string model_version = 3;
+  string symbol = 4;
+  double predicted_return = 5;
+  double predicted_volatility = 6;
+  double confidence = 7;
+  // Full model output for auditability.
+  google.protobuf.Struct raw_output = 8;
+  // Feature importance scores keyed by feature name.
+  // NOTE(review): type arguments restored — "map" without <key, value> is
+  // invalid proto3; double assumed for importance scores, confirm codegen.
+  map<string, double> feature_importance = 9;
+  double latency_ms = 10;
+  int32 horizon_seconds = 11;
+  google.protobuf.Timestamp timestamp = 12;
+}
+
+// Risk evaluation for a proposed trade.
+message RiskAssessment {
+  string assessment_id = 1;
+  string symbol = 2;
+  string proposed_quantity = 3;  // String-encoded decimal.
+  string proposed_notional_usd = 4;
+  double current_drawdown_pct = 5;
+  double position_concentration_pct = 6;
+  double var_1d_pct = 7;
+  double sharpe_estimate = 8;
+  bool is_approved = 9;
+  repeated string rejection_reasons = 10;
+  double risk_score = 11;
+  google.protobuf.Timestamp timestamp = 12;
+}
+
+// Final decision from the AGI orchestration layer.
+message AGIDecision {
+  string decision_id = 1;
+  string symbol = 2;
+  DecisionAction action = 3;
+  double confidence = 4;
+  string suggested_quantity = 5;  // String-encoded decimal.
+  string suggested_price = 6;
+  repeated TradingSignal signals = 7;
+  repeated ModelPrediction predictions = 8;
+  RiskAssessment risk_assessment = 9;
+  string reasoning = 10;
+  // Arbitrary metadata map for traceability.
+ google.protobuf.Struct metadata = 11; + google.protobuf.Timestamp timestamp = 12; + bool executed = 13; + string execution_order_id = 14; +} + +// --------------------------------------------------------------------------- +// Request / response messages +// --------------------------------------------------------------------------- + +message GenerateSignalRequest { + string symbol = 1; + // Serialised market snapshot passed to the model (JSON blob). + string market_snapshot_json = 2; + // Model parameters override (optional). + google.protobuf.Struct params = 3; +} + +message GenerateSignalResponse { + TradingSignal signal = 1; + string error_message = 2; +} + +message RunInferenceRequest { + string model_id = 1; + string symbol = 2; + // Feature vector as key-value pairs. + google.protobuf.Struct features = 3; +} + +message RunInferenceResponse { + ModelPrediction prediction = 1; + string error_message = 2; +} + +message EvaluateRiskRequest { + string symbol = 1; + string proposed_quantity = 2; + string proposed_notional_usd = 3; + // Current portfolio state (JSON blob). + string portfolio_json = 4; +} + +message EvaluateRiskResponse { + RiskAssessment assessment = 1; + string error_message = 2; +} + +message MakeDecisionRequest { + string symbol = 1; + string market_snapshot_json = 2; + string portfolio_json = 3; + // Optional caller-supplied signals to merge with AGI signals. + repeated TradingSignal override_signals = 4; +} + +message MakeDecisionResponse { + AGIDecision decision = 1; + string error_message = 2; +} + +message GetModelStatusRequest { + string model_id = 1; +} + +message ModelStatus { + string model_id = 1; + string model_version = 2; + bool is_loaded = 3; + bool is_healthy = 4; + double average_latency_ms = 5; + int64 total_inferences = 6; + google.protobuf.Timestamp last_inference_at = 7; +} + +message GetModelStatusResponse { + repeated ModelStatus models = 1; +} + +// Request for the StreamSignals RPC with optional per-symbol filter. 
+message StreamSignalsRequest { + // Optional list of symbols to subscribe to. Empty = all symbols. + repeated string symbols = 1; + // Minimum confidence threshold; signals below this are suppressed. + double min_confidence = 2; +} + +// Streamed signal feed pushed to subscribers. +message SignalStreamUpdate { + TradingSignal signal = 1; + google.protobuf.Timestamp event_time = 2; +} + +// --------------------------------------------------------------------------- +// Service definition +// --------------------------------------------------------------------------- + +service AGIService { + // Generate a trading signal for a symbol using the AGI signal pipeline. + rpc GenerateSignal(GenerateSignalRequest) returns (GenerateSignalResponse); + + // Run a specific model inference. + rpc RunInference(RunInferenceRequest) returns (RunInferenceResponse); + + // Evaluate risk for a proposed trade. + rpc EvaluateRisk(EvaluateRiskRequest) returns (EvaluateRiskResponse); + + // Produce a full AGI decision combining signals, predictions and risk. + rpc MakeDecision(MakeDecisionRequest) returns (MakeDecisionResponse); + + // Query the health and status of loaded models. + rpc GetModelStatus(GetModelStatusRequest) returns (GetModelStatusResponse); + + // Server-streaming: subscribe to real-time signal updates for all symbols. 
+  rpc StreamSignals(StreamSignalsRequest) returns (stream SignalStreamUpdate);
+}
diff --git a/shared/proto/monitoring.proto b/shared/proto/monitoring.proto
new file mode 100644
index 0000000..f7e3ca2
--- /dev/null
+++ b/shared/proto/monitoring.proto
@@ -0,0 +1,245 @@
+syntax = "proto3";
+
+package monitoring;
+
+option go_package = "github.com/rag7/trading/proto/monitoring";
+option java_multiple_files = true;
+option java_package = "com.rag7.trading.proto.monitoring";
+
+import "google/protobuf/timestamp.proto";
+import "google/protobuf/struct.proto";
+import "google/protobuf/empty.proto";
+
+// ---------------------------------------------------------------------------
+// Enumerations
+// ---------------------------------------------------------------------------
+
+enum HealthStatus {
+  HEALTH_STATUS_UNSPECIFIED = 0;
+  HEALTH_STATUS_HEALTHY = 1;
+  HEALTH_STATUS_DEGRADED = 2;
+  HEALTH_STATUS_UNHEALTHY = 3;
+}
+
+enum AlertSeverity {
+  ALERT_SEVERITY_UNSPECIFIED = 0;
+  ALERT_SEVERITY_INFO = 1;
+  ALERT_SEVERITY_WARNING = 2;
+  ALERT_SEVERITY_ERROR = 3;
+  ALERT_SEVERITY_CRITICAL = 4;
+}
+
+enum MetricType {
+  METRIC_TYPE_UNSPECIFIED = 0;
+  METRIC_TYPE_COUNTER = 1;
+  METRIC_TYPE_GAUGE = 2;
+  METRIC_TYPE_HISTOGRAM = 3;
+  METRIC_TYPE_SUMMARY = 4;
+}
+
+// ---------------------------------------------------------------------------
+// Metric messages
+// ---------------------------------------------------------------------------
+
+// A single time-series sample for a named metric.
+message MetricSample {
+  string name = 1;
+  double value = 2;
+  // Label key/value pairs (Prometheus-style).  Type arguments restored:
+  // "map" without <key, value> is invalid proto3 syntax.
+  map<string, string> labels = 3;
+  MetricType type = 4;
+  string unit = 5;
+  google.protobuf.Timestamp timestamp = 6;
+}
+
+// Histogram bucket definition.
+message HistogramBucket {
+  double upper_bound = 1;
+  uint64 count = 2;
+}
+
+// Rich histogram metric with full distribution.
+message HistogramMetric {
+  string name = 1;
+  // Label key/value pairs; type arguments restored (bare "map" is invalid proto3).
+  map<string, string> labels = 2;
+  repeated HistogramBucket buckets = 3;
+  uint64 count = 4;
+  double sum = 5;
+  double mean = 6;
+  double p50 = 7;
+  double p95 = 8;
+  double p99 = 9;
+  google.protobuf.Timestamp timestamp = 10;
+}
+
+// ---------------------------------------------------------------------------
+// Health messages
+// ---------------------------------------------------------------------------
+
+// Health of a single service component.
+message ComponentHealth {
+  string component_name = 1;
+  HealthStatus status = 2;
+  string message = 3;
+  double latency_ms = 4;
+  google.protobuf.Timestamp checked_at = 5;
+  // Arbitrary diagnostic key-value pairs.
+  google.protobuf.Struct details = 6;
+}
+
+// Aggregated health report for a service.
+message ServiceHealth {
+  string service_name = 1;
+  string service_version = 2;
+  HealthStatus overall_status = 3;
+  repeated ComponentHealth components = 4;
+  google.protobuf.Timestamp report_time = 5;
+  // Uptime in seconds since last restart.
+  int64 uptime_seconds = 6;
+}
+
+// ---------------------------------------------------------------------------
+// Alert messages
+// ---------------------------------------------------------------------------
+
+message Alert {
+  string alert_id = 1;
+  string name = 2;
+  AlertSeverity severity = 3;
+  string source_service = 4;
+  string message = 5;
+  // Contextual data associated with the alert.
+  google.protobuf.Struct context = 6;
+  bool is_firing = 7;  // True = active, False = resolved.
+  google.protobuf.Timestamp fired_at = 8;
+  google.protobuf.Timestamp resolved_at = 9;
+  repeated string labels = 10;
+  string runbook_url = 11;
+}
+
+// ---------------------------------------------------------------------------
+// Performance / trading metrics
+// ---------------------------------------------------------------------------
+
+// Snapshot of trading-engine performance metrics.
+message TradingMetrics {
+  string service_name = 1;
+  // Order metrics.
+  int64 orders_submitted_total = 2;
+  int64 orders_filled_total = 3;
+  int64 orders_rejected_total = 4;
+  int64 orders_cancelled_total = 5;
+  // Latency metrics.
+  double order_submission_latency_p50_ms = 6;
+  double order_submission_latency_p99_ms = 7;
+  double fill_latency_p50_ms = 8;
+  double fill_latency_p99_ms = 9;
+  // P&L metrics.
+  double total_realised_pnl_usd = 10;
+  double total_unrealised_pnl_usd = 11;
+  double current_drawdown_pct = 12;
+  double daily_pnl_usd = 13;
+  // Position metrics.
+  int32 open_positions_count = 14;
+  double total_notional_usd = 15;
+  // Throughput.
+  double orders_per_second = 16;
+  double fills_per_second = 17;
+  google.protobuf.Timestamp snapshot_time = 18;
+}
+
+// ---------------------------------------------------------------------------
+// Request / response messages
+// ---------------------------------------------------------------------------
+
+message CheckHealthRequest {
+  // Empty = check all services; populated = check specific service.
+  string service_name = 1;
+}
+
+message CheckHealthResponse {
+  repeated ServiceHealth services = 1;
+  HealthStatus overall_status = 2;
+}
+
+message GetMetricsRequest {
+  string service_name = 1;
+  repeated string metric_names = 2;  // Empty = return all.
+  // Label filter key/value pairs; type arguments restored
+  // (bare "map" is invalid proto3).
+  map<string, string> label_filter = 3;
+  google.protobuf.Timestamp start_time = 4;
+  google.protobuf.Timestamp end_time = 5;
+}
+
+message GetMetricsResponse {
+  repeated MetricSample samples = 1;
+  repeated HistogramMetric histograms = 2;
+  string error_message = 3;
+}
+
+message GetTradingMetricsRequest {
+  string service_name = 1;
+}
+
+message GetTradingMetricsResponse {
+  TradingMetrics metrics = 1;
+  string error_message = 2;
+}
+
+message ListAlertsRequest {
+  bool active_only = 1;  // When true, return only firing alerts.
+  AlertSeverity min_severity = 2;
+  string source_service = 3;  // Optional service filter.
+ int32 limit = 4; + string page_token = 5; +} + +message ListAlertsResponse { + repeated Alert alerts = 1; + string next_page_token = 2; + int32 total_count = 3; +} + +message AcknowledgeAlertRequest { + string alert_id = 1; + string acknowledged_by = 2; + string note = 3; +} + +message AcknowledgeAlertResponse { + bool success = 1; + string error_message = 2; +} + +// Pushed event on the live metrics stream. +message MetricsStreamEvent { + oneof payload { + MetricSample sample = 1; + Alert alert = 2; + ServiceHealth health = 3; + TradingMetrics trading_metrics = 4; + } + google.protobuf.Timestamp event_time = 5; +} + +// --------------------------------------------------------------------------- +// Service definition +// --------------------------------------------------------------------------- + +service MonitoringService { + // Check the health of one or all services. + rpc CheckHealth(CheckHealthRequest) returns (CheckHealthResponse); + + // Retrieve time-series metric samples. + rpc GetMetrics(GetMetricsRequest) returns (GetMetricsResponse); + + // Retrieve trading-specific performance metrics. + rpc GetTradingMetrics(GetTradingMetricsRequest) returns (GetTradingMetricsResponse); + + // List active or historical alerts. + rpc ListAlerts(ListAlertsRequest) returns (ListAlertsResponse); + + // Acknowledge a firing alert. + rpc AcknowledgeAlert(AcknowledgeAlertRequest) returns (AcknowledgeAlertResponse); + + // Server-streaming: subscribe to a live feed of metrics, alerts and health events. 
+ rpc StreamMetrics(google.protobuf.Empty) returns (stream MetricsStreamEvent); +} diff --git a/shared/proto/trading.proto b/shared/proto/trading.proto new file mode 100644 index 0000000..7c2dbb7 --- /dev/null +++ b/shared/proto/trading.proto @@ -0,0 +1,229 @@ +syntax = "proto3"; + +package trading; + +option go_package = "github.com/rag7/trading/proto/trading"; +option java_multiple_files = true; +option java_package = "com.rag7.trading.proto"; + +import "google/protobuf/timestamp.proto"; +import "google/protobuf/empty.proto"; + +// --------------------------------------------------------------------------- +// Enumerations +// --------------------------------------------------------------------------- + +enum OrderSide { + ORDER_SIDE_UNSPECIFIED = 0; + ORDER_SIDE_BUY = 1; + ORDER_SIDE_SELL = 2; +} + +enum OrderType { + ORDER_TYPE_UNSPECIFIED = 0; + ORDER_TYPE_MARKET = 1; + ORDER_TYPE_LIMIT = 2; + ORDER_TYPE_STOP_MARKET = 3; + ORDER_TYPE_STOP_LIMIT = 4; + ORDER_TYPE_TAKE_PROFIT = 5; + ORDER_TYPE_TAKE_PROFIT_LIMIT = 6; + ORDER_TYPE_TRAILING_STOP = 7; +} + +enum OrderStatus { + ORDER_STATUS_UNSPECIFIED = 0; + ORDER_STATUS_PENDING = 1; + ORDER_STATUS_SUBMITTED = 2; + ORDER_STATUS_ACCEPTED = 3; + ORDER_STATUS_PARTIALLY_FILLED = 4; + ORDER_STATUS_FILLED = 5; + ORDER_STATUS_CANCELLED = 6; + ORDER_STATUS_REJECTED = 7; + ORDER_STATUS_EXPIRED = 8; +} + +enum TimeInForce { + TIME_IN_FORCE_UNSPECIFIED = 0; + TIME_IN_FORCE_GTC = 1; // Good Till Cancelled + TIME_IN_FORCE_IOC = 2; // Immediate Or Cancel + TIME_IN_FORCE_FOK = 3; // Fill Or Kill + TIME_IN_FORCE_GTD = 4; // Good Till Date +} + +// --------------------------------------------------------------------------- +// Core messages +// --------------------------------------------------------------------------- + +// Represents a single order fill / execution. 
+message Fill {
+  string fill_id = 1;
+  string order_id = 2;
+  string symbol = 3;
+  OrderSide side = 4;
+  // Prices and quantities are transmitted as string-encoded decimals to
+  // preserve precision across languages.
+  string price = 5;
+  string quantity = 6;
+  string commission = 7;
+  string commission_asset = 8;
+  string trade_id = 9;
+  google.protobuf.Timestamp timestamp = 10;
+}
+
+// Full order state.
+message Order {
+  string order_id = 1;
+  string exchange_order_id = 2;
+  string symbol = 3;
+  OrderSide side = 4;
+  OrderType order_type = 5;
+  string quantity = 6;
+  string price = 7;
+  string stop_price = 8;
+  TimeInForce time_in_force = 9;
+  OrderStatus status = 10;
+  string filled_quantity = 11;
+  string average_fill_price = 12;
+  repeated Fill fills = 13;
+  string strategy_id = 14;
+  // Free-form tag key/value pairs; type arguments restored
+  // (bare "map" is invalid proto3).
+  map<string, string> tags = 15;
+  google.protobuf.Timestamp created_at = 16;
+  google.protobuf.Timestamp updated_at = 17;
+}
+
+// Open position in a single instrument.
+message Position {
+  string symbol = 1;
+  OrderSide side = 2;
+  string quantity = 3;
+  string average_entry_price = 4;
+  string unrealised_pnl = 5;
+  string realised_pnl = 6;
+  string notional = 7;
+  string strategy_id = 8;
+  google.protobuf.Timestamp opened_at = 9;
+  google.protobuf.Timestamp updated_at = 10;
+}
+
+// Aggregate portfolio snapshot.
+message Portfolio {
+  string portfolio_id = 1;
+  string account_id = 2;
+  // Positions keyed by symbol, mirroring the Python model's
+  // dict[str, Position]; type arguments restored (bare "map" is invalid proto3).
+  map<string, Position> positions = 3;
+  string cash_balance = 4;
+  string total_equity = 5;
+  string total_unrealised_pnl = 6;
+  string total_realised_pnl = 7;
+  string peak_equity = 8;
+  string current_drawdown_pct = 9;
+  google.protobuf.Timestamp updated_at = 10;
+}
+
+// ---------------------------------------------------------------------------
+// Request / response messages
+// ---------------------------------------------------------------------------
+
+message SubmitOrderRequest {
+  string client_request_id = 1;  // Idempotency key.
+ string symbol = 2; + OrderSide side = 3; + OrderType order_type = 4; + string quantity = 5; + string price = 6; + string stop_price = 7; + TimeInForce time_in_force = 8; + string strategy_id = 9; + map tags = 10; +} + +message SubmitOrderResponse { + Order order = 1; + string error_message = 2; +} + +message CancelOrderRequest { + string order_id = 1; + string symbol = 2; +} + +message CancelOrderResponse { + Order order = 1; + bool success = 2; + string error_message = 3; +} + +message GetOrderRequest { + string order_id = 1; +} + +message GetOrderResponse { + Order order = 1; + string error_message = 2; +} + +message ListOrdersRequest { + string symbol = 1; // Optional: filter by symbol. + OrderStatus status_filter = 2; // Optional: filter by status. + string strategy_id = 3; // Optional: filter by strategy. + int32 limit = 4; + string page_token = 5; +} + +message ListOrdersResponse { + repeated Order orders = 1; + string next_page_token = 2; + int32 total_count = 3; +} + +message GetPositionRequest { + string symbol = 1; +} + +message GetPositionResponse { + Position position = 1; + string error_message = 2; +} + +message GetPortfolioRequest { + string account_id = 1; +} + +message GetPortfolioResponse { + Portfolio portfolio = 1; + string error_message = 2; +} + +// Streamed order-status update pushed to subscribers. +message OrderStatusUpdate { + Order order = 1; + Fill latest_fill = 2; // Populated when status changed due to fill. + string reason = 3; // Human-readable reason for the status change. + google.protobuf.Timestamp event_time = 4; +} + +// --------------------------------------------------------------------------- +// Service definition +// --------------------------------------------------------------------------- + +service TradingService { + // Submit a new order to the exchange. + rpc SubmitOrder(SubmitOrderRequest) returns (SubmitOrderResponse); + + // Cancel an existing open order. 
+ rpc CancelOrder(CancelOrderRequest) returns (CancelOrderResponse); + + // Retrieve a single order by ID. + rpc GetOrder(GetOrderRequest) returns (GetOrderResponse); + + // List orders with optional filters. + rpc ListOrders(ListOrdersRequest) returns (ListOrdersResponse); + + // Retrieve the current open position for a symbol. + rpc GetPosition(GetPositionRequest) returns (GetPositionResponse); + + // Retrieve the full portfolio snapshot. + rpc GetPortfolio(GetPortfolioRequest) returns (GetPortfolioResponse); + + // Server-streaming: subscribe to real-time order status updates. + rpc StreamOrderUpdates(google.protobuf.Empty) returns (stream OrderStatusUpdate); +} diff --git a/synthetic-ai/__init__.py b/synthetic-ai/__init__.py new file mode 100644 index 0000000..2b4d1be --- /dev/null +++ b/synthetic-ai/__init__.py @@ -0,0 +1,99 @@ +"""Synthetic AI – market simulation and synthetic data generation module. + +Exposes the :class:`SyntheticAI` orchestrator which wires together price +simulation, scenario generation, backtesting, Monte Carlo analysis, and +data-validation sub-systems. +""" + +from __future__ import annotations + +from typing import Any + +import numpy as np +from loguru import logger + +from synthetic_ai.generators.market_simulator import MarketSimulator +from synthetic_ai.generators.scenario_generator import ScenarioGenerator +from synthetic_ai.generators.adversarial_generator import AdversarialGenerator +from synthetic_ai.generators.synthetic_data_forge import SyntheticDataForge +from synthetic_ai.simulation.backtesting_engine import BacktestingEngine +from synthetic_ai.simulation.monte_carlo import MonteCarlo +from synthetic_ai.simulation.agent_simulation import AgentSimulation +from synthetic_ai.validation.reality_checker import RealityChecker +from synthetic_ai.validation.distribution_matcher import DistributionMatcher + + +class SyntheticAI: + """Top-level orchestrator for synthetic data and market simulation. 
+ + Attributes: + simulator: Geometric Brownian Motion price simulator. + scenario: Bull / bear / crash scenario generator. + adversarial: Edge-case event generator. + forge: Training data augmentation engine. + backtester: Strategy back-testing engine. + monte_carlo: Probabilistic scenario modeller. + agents: Multi-agent market simulation. + reality_checker: Synthetic-vs-real data validator. + distribution_matcher: Statistical distribution validator. + """ + + def __init__(self, config: dict[str, Any] | None = None) -> None: + """Initialise SyntheticAI and all sub-systems. + + Args: + config: Optional configuration overrides keyed by sub-system name. + """ + cfg = config or {} + logger.info("Initialising SyntheticAI") + + self.simulator = MarketSimulator(**cfg.get("simulator", {})) + self.scenario = ScenarioGenerator(**cfg.get("scenario", {})) + self.adversarial = AdversarialGenerator(**cfg.get("adversarial", {})) + self.forge = SyntheticDataForge(**cfg.get("forge", {})) + + self.backtester = BacktestingEngine(**cfg.get("backtester", {})) + self.monte_carlo = MonteCarlo(**cfg.get("monte_carlo", {})) + self.agents = AgentSimulation(**cfg.get("agents", {})) + + self.reality_checker = RealityChecker(**cfg.get("reality_checker", {})) + self.distribution_matcher = DistributionMatcher( + **cfg.get("distribution_matcher", {}) + ) + + logger.info("SyntheticAI initialised successfully") + + def generate_training_dataset( + self, + n_paths: int = 100, + n_steps: int = 252, + s0: float = 100.0, + mu: float = 0.05, + sigma: float = 0.20, + ) -> dict[str, np.ndarray]: + """Generate a synthetic training dataset of price paths. + + Args: + n_paths: Number of independent price paths to simulate. + n_steps: Number of time steps per path. + s0: Initial asset price. + mu: Annual drift (expected return). + sigma: Annual volatility. + + Returns: + Dict with key ``paths`` containing an array of shape + ``(n_paths, n_steps + 1)``. 
+ """ + logger.info(f"Generating training dataset: {n_paths} paths × {n_steps} steps") + paths = np.stack( + [ + self.simulator.simulate( + s0=s0, mu=mu, sigma=sigma, n_steps=n_steps, dt=1 / 252 + ) + for _ in range(n_paths) + ] + ) + return {"paths": paths} + + +__all__ = ["SyntheticAI"] diff --git a/synthetic-ai/generators/__init__.py b/synthetic-ai/generators/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/synthetic-ai/generators/__pycache__/__init__.cpython-312.pyc b/synthetic-ai/generators/__pycache__/__init__.cpython-312.pyc new file mode 100644 index 0000000..c2b1645 Binary files /dev/null and b/synthetic-ai/generators/__pycache__/__init__.cpython-312.pyc differ diff --git a/synthetic-ai/generators/__pycache__/adversarial_generator.cpython-312.pyc b/synthetic-ai/generators/__pycache__/adversarial_generator.cpython-312.pyc new file mode 100644 index 0000000..616ac2d Binary files /dev/null and b/synthetic-ai/generators/__pycache__/adversarial_generator.cpython-312.pyc differ diff --git a/synthetic-ai/generators/__pycache__/market_simulator.cpython-312.pyc b/synthetic-ai/generators/__pycache__/market_simulator.cpython-312.pyc new file mode 100644 index 0000000..f8cb71f Binary files /dev/null and b/synthetic-ai/generators/__pycache__/market_simulator.cpython-312.pyc differ diff --git a/synthetic-ai/generators/__pycache__/scenario_generator.cpython-312.pyc b/synthetic-ai/generators/__pycache__/scenario_generator.cpython-312.pyc new file mode 100644 index 0000000..0768a66 Binary files /dev/null and b/synthetic-ai/generators/__pycache__/scenario_generator.cpython-312.pyc differ diff --git a/synthetic-ai/generators/__pycache__/synthetic_data_forge.cpython-312.pyc b/synthetic-ai/generators/__pycache__/synthetic_data_forge.cpython-312.pyc new file mode 100644 index 0000000..343d543 Binary files /dev/null and b/synthetic-ai/generators/__pycache__/synthetic_data_forge.cpython-312.pyc differ diff --git 
a/synthetic-ai/generators/adversarial_generator.py b/synthetic-ai/generators/adversarial_generator.py new file mode 100644 index 0000000..25d0be2 --- /dev/null +++ b/synthetic-ai/generators/adversarial_generator.py @@ -0,0 +1,252 @@ +"""Adversarial data generation: edge-case and stress-test event simulation. + +Provides :class:`AdversarialGenerator` for creating extreme market events such +as flash crashes, liquidity crises, and gap events for stress testing. +""" + +from __future__ import annotations + +from dataclasses import dataclass +from typing import Any + +import numpy as np +from loguru import logger + + +@dataclass +class EdgeEvent: + """Parameterises an extreme market event. + + Attributes: + name: Event identifier. + price_shock: Instantaneous log-price shock. + vol_spike_factor: Volatility multiplier during the event. + duration_steps: Number of steps the event lasts. + recovery_halflife: Steps for mean-reversion after shock. + """ + + name: str + price_shock: float + vol_spike_factor: float + duration_steps: int + recovery_halflife: int + + +_BUILT_IN_EVENTS: dict[str, EdgeEvent] = { + "flash_crash": EdgeEvent( + "flash_crash", + price_shock=-0.10, + vol_spike_factor=8.0, + duration_steps=5, + recovery_halflife=3, + ), + "liquidity_crisis": EdgeEvent( + "liquidity_crisis", + price_shock=-0.25, + vol_spike_factor=5.0, + duration_steps=20, + recovery_halflife=15, + ), + "gap_up": EdgeEvent( + "gap_up", + price_shock=0.08, + vol_spike_factor=2.0, + duration_steps=2, + recovery_halflife=5, + ), + "gap_down": EdgeEvent( + "gap_down", + price_shock=-0.08, + vol_spike_factor=2.5, + duration_steps=2, + recovery_halflife=5, + ), + "short_squeeze": EdgeEvent( + "short_squeeze", + price_shock=0.40, + vol_spike_factor=6.0, + duration_steps=3, + recovery_halflife=10, + ), + "black_swan": EdgeEvent( + "black_swan", + price_shock=-0.50, + vol_spike_factor=15.0, + duration_steps=30, + recovery_halflife=60, + ), +} + + +class AdversarialGenerator: + """Generate 
adversarial market scenarios for stress testing. + + Injects extreme events (flash crashes, liquidity crises, gap events) into + a base GBM price path to create worst-case training/testing data. + + Attributes: + seed: Random seed. + base_mu: Base drift for background GBM. + base_sigma: Base volatility for background GBM. + """ + + def __init__( + self, + seed: int | None = None, + base_mu: float = 0.0, + base_sigma: float = 0.20, + ) -> None: + """Initialise AdversarialGenerator. + + Args: + seed: NumPy random seed. + base_mu: Annual drift of the background process. + base_sigma: Annual volatility of the background process. + """ + self.base_mu = base_mu + self.base_sigma = base_sigma + self._rng = np.random.default_rng(seed) + + # ------------------------------------------------------------------ + # Private helpers + # ------------------------------------------------------------------ + + def _gbm_step(self, price: float, mu: float, sigma: float, dt: float) -> float: + """Compute one GBM step. + + Args: + price: Current price. + mu: Annual drift. + sigma: Annual volatility. + dt: Step size in years. + + Returns: + Next price. + """ + z = self._rng.standard_normal() + log_ret = (mu - 0.5 * sigma ** 2) * dt + sigma * np.sqrt(dt) * z + return float(price * np.exp(log_ret)) + + def _apply_event( + self, + prices: np.ndarray, + event: EdgeEvent, + inject_at: int, + dt: float, + ) -> np.ndarray: + """Inject an edge event into a price series. + + Args: + prices: Existing price array (modified in-place clone). + event: Edge event specification. + inject_at: Step index at which the event begins. + dt: Step size in years. + + Returns: + Modified price array. 
+ """ + result = prices.copy() + n = len(result) + + # Instant shock + if inject_at < n: + result[inject_at] *= np.exp(event.price_shock) + + # High-vol drift during event duration + event_sigma = self.base_sigma * event.vol_spike_factor + for i in range(inject_at + 1, min(inject_at + event.duration_steps + 1, n)): + result[i] = self._gbm_step(result[i - 1], self.base_mu, event_sigma, dt) + + # Mean-reversion recovery + recovery_end = min(inject_at + event.duration_steps + event.recovery_halflife, n) + for i in range(inject_at + event.duration_steps + 1, recovery_end): + decay = np.exp(-1.0 / event.recovery_halflife) + recovery_sigma = self.base_sigma * ( + 1.0 + (event.vol_spike_factor - 1.0) * decay + ) + result[i] = self._gbm_step(result[i - 1], self.base_mu, recovery_sigma, dt) + + return result + + # ------------------------------------------------------------------ + # Public interface + # ------------------------------------------------------------------ + + def generate( + self, + event_name: str, + s0: float = 100.0, + n_steps: int = 252, + dt: float = 1 / 252, + inject_at: int | None = None, + ) -> dict[str, Any]: + """Generate a price path with an injected edge event. + + Args: + event_name: Name of the event (must be in built-in set or + registered via :meth:`register_event`). + s0: Initial price. + n_steps: Total number of steps. + dt: Step size in years. + inject_at: Step at which the event is injected; defaults to 25% of + the way through the path. + + Returns: + Dict with keys ``event``, ``prices``, ``returns``, + ``inject_at``, ``max_drawdown``. + + Raises: + KeyError: If *event_name* is not registered. + """ + if event_name not in _BUILT_IN_EVENTS: + raise KeyError( + f"Unknown event '{event_name}'. 
class MarketSimulator:
    """Simulate asset price paths using Geometric Brownian Motion (GBM).

    Implements continuous GBM:
    ``S(t+dt) = S(t) * exp((mu - 0.5 * sigma^2) * dt + sigma * sqrt(dt) * Z)``
    where *Z* ~ N(0, 1).  Optionally adds Poisson jump-diffusion for
    fat-tail modelling.

    Attributes:
        seed: Optional random seed for reproducibility.
        use_jumps: Whether to add Poisson jump-diffusion.
        jump_intensity: Expected number of jumps per year (lambda).
        jump_mean: Mean log-jump size.
        jump_std: Standard deviation of log-jump size.
    """

    def __init__(
        self,
        seed: int | None = None,
        use_jumps: bool = False,
        jump_intensity: float = 2.0,
        jump_mean: float = -0.05,
        jump_std: float = 0.10,
    ) -> None:
        """Initialise MarketSimulator.

        Args:
            seed: NumPy random seed (None for non-deterministic).
            use_jumps: Enable jump-diffusion component.
            jump_intensity: Average jumps per year.
            jump_mean: Mean of log-normal jump size distribution.
            jump_std: Std-dev of log-normal jump size distribution.
        """
        self.seed = seed
        self.use_jumps = use_jumps
        self.jump_intensity = jump_intensity
        self.jump_mean = jump_mean
        self.jump_std = jump_std
        self._rng = np.random.default_rng(seed)

    # ------------------------------------------------------------------
    # Public interface
    # ------------------------------------------------------------------

    def simulate(
        self,
        s0: float = 100.0,
        mu: float = 0.05,
        sigma: float = 0.20,
        n_steps: int = 252,
        dt: float = 1 / 252,
    ) -> np.ndarray:
        """Simulate a single GBM price path.

        Args:
            s0: Initial asset price (must be > 0).
            mu: Annual expected return (drift).
            sigma: Annual volatility (must be >= 0).
            n_steps: Number of time steps (must be > 0).
            dt: Length of each time step in years (default: 1 trading day).

        Returns:
            Price path array of length ``n_steps + 1`` (includes initial price).

        Raises:
            ValueError: If s0 or n_steps is non-positive, or sigma is negative.
        """
        if s0 <= 0:
            raise ValueError("s0 must be positive.")
        if sigma < 0:
            raise ValueError("sigma must be non-negative.")
        if n_steps <= 0:
            raise ValueError("n_steps must be positive.")

        z = self._rng.standard_normal(n_steps)
        log_returns = (mu - 0.5 * sigma ** 2) * dt + sigma * np.sqrt(dt) * z

        if self.use_jumps:
            # Poisson-distributed jump count per step; each jump adds an
            # independent normal log-return shock (Merton jump-diffusion).
            n_jumps = self._rng.poisson(self.jump_intensity * dt, n_steps)
            for i, nj in enumerate(n_jumps):
                if nj > 0:
                    jump_sizes = self._rng.normal(self.jump_mean, self.jump_std, nj)
                    log_returns[i] += np.sum(jump_sizes)

        # Vectorised path construction (replaces the per-step Python loop).
        prices = np.empty(n_steps + 1)
        prices[0] = s0
        prices[1:] = s0 * np.exp(np.cumsum(log_returns))
        return prices

    def simulate_correlated(
        self,
        n_assets: int,
        correlation_matrix: Any,
        s0_vector: Any | None = None,
        mu_vector: Any | None = None,
        sigma_vector: Any | None = None,
        n_steps: int = 252,
        dt: float = 1 / 252,
    ) -> np.ndarray:
        """Simulate multiple correlated GBM price paths.

        Uses Cholesky decomposition to impose cross-asset correlations.

        Args:
            n_assets: Number of assets.
            correlation_matrix: Array-like of shape ``(n_assets, n_assets)``.
            s0_vector: Initial prices; defaults to all 100.
            mu_vector: Annual drifts; defaults to all 0.05.
            sigma_vector: Annual vols; defaults to all 0.20.
            n_steps: Number of time steps.
            dt: Step size in years.

        Returns:
            Price array of shape ``(n_assets, n_steps + 1)``.

        Raises:
            ValueError: If the correlation matrix has the wrong shape or is
                not positive definite.
        """
        try:
            from loguru import logger
        except ImportError:  # pragma: no cover - stdlib fallback for isolated use
            import logging
            logger = logging.getLogger(__name__)

        corr = np.asarray(correlation_matrix, dtype=np.float64)
        if corr.shape != (n_assets, n_assets):
            raise ValueError("correlation_matrix shape must be (n_assets, n_assets).")

        # BUG FIX: the previous ``x or default`` idiom raised
        # "truth value of an array is ambiguous" when callers passed NumPy
        # arrays (and silently replaced falsy scalar inputs); test for None
        # explicitly instead.
        s0 = np.full(n_assets, 100.0) if s0_vector is None else np.asarray(s0_vector, dtype=float)
        mu = np.full(n_assets, 0.05) if mu_vector is None else np.asarray(mu_vector, dtype=float)
        sigma = np.full(n_assets, 0.20) if sigma_vector is None else np.asarray(sigma_vector, dtype=float)

        try:
            chol = np.linalg.cholesky(corr)
        except np.linalg.LinAlgError as exc:
            raise ValueError("correlation_matrix is not positive definite.") from exc

        prices = np.empty((n_assets, n_steps + 1))
        prices[:, 0] = s0

        z_indep = self._rng.standard_normal((n_assets, n_steps))
        z_corr = chol @ z_indep

        for i in range(n_steps):
            log_ret = (mu - 0.5 * sigma ** 2) * dt + sigma * np.sqrt(dt) * z_corr[:, i]
            prices[:, i + 1] = prices[:, i] * np.exp(log_ret)

        logger.debug(
            f"Simulated {n_assets} correlated paths over {n_steps} steps"
        )
        return prices
@dataclass
class Scenario:
    """Describes a named market scenario.

    Attributes:
        name: Scenario label (e.g., ``"bear"``).
        drift_multiplier: Multiplier applied to the base drift.
        volatility_multiplier: Multiplier applied to the base volatility.
        shock: One-time log-price shock applied at *shock_step* (0 = none).
        shock_step: Index (0-based) at which the shock is applied.
        description: Human-readable description.
    """

    name: str
    drift_multiplier: float
    volatility_multiplier: float
    shock: float = 0.0
    shock_step: int | None = None
    description: str = ""


# Built-in scenario library; copied into each generator's registry.
_BUILT_IN_SCENARIOS: dict[str, Scenario] = {
    "bull": Scenario(
        "bull", drift_multiplier=2.5, volatility_multiplier=0.8,
        description="Sustained upward trend with compressed volatility",
    ),
    "bear": Scenario(
        "bear", drift_multiplier=-1.5, volatility_multiplier=1.4,
        description="Sustained downward trend with elevated volatility",
    ),
    "crash": Scenario(
        "crash", drift_multiplier=-3.0, volatility_multiplier=3.0,
        shock=-0.20, shock_step=10,
        description="Sudden 20% gap-down followed by high-volatility recovery",
    ),
    "rally": Scenario(
        "rally", drift_multiplier=4.0, volatility_multiplier=1.2,
        shock=0.10, shock_step=5,
        description="10% gap-up followed by continued bullish momentum",
    ),
    "sideways": Scenario(
        "sideways", drift_multiplier=0.0, volatility_multiplier=0.6,
        description="Range-bound low-volatility consolidation",
    ),
    "high_vol": Scenario(
        "high_vol", drift_multiplier=0.5, volatility_multiplier=3.5,
        description="Elevated volatility with muted directional trend",
    ),
}


class ScenarioGenerator:
    """Generate what-if market scenarios from a base set of parameters.

    Attributes:
        simulator: Underlying :class:`MarketSimulator` instance.
        custom_scenarios: User-defined scenarios merged with built-ins.
    """

    def __init__(
        self,
        seed: int | None = None,
        custom_scenarios: dict[str, dict[str, Any]] | None = None,
    ) -> None:
        """Initialise ScenarioGenerator.

        Args:
            seed: Random seed for reproducibility.
            custom_scenarios: Additional scenarios to register. Each key is a
                scenario name and the value a dict of :class:`Scenario` fields.
        """
        self.simulator = MarketSimulator(seed=seed)
        # Copy built-ins so registering custom scenarios never mutates the
        # shared module-level table.
        self.custom_scenarios: dict[str, Scenario] = {**_BUILT_IN_SCENARIOS}
        if custom_scenarios:
            for name, cfg in custom_scenarios.items():
                self.custom_scenarios[name] = Scenario(name=name, **cfg)

    # ------------------------------------------------------------------
    # Public interface
    # ------------------------------------------------------------------

    def generate(
        self,
        scenario_name: str,
        s0: float = 100.0,
        base_mu: float = 0.05,
        base_sigma: float = 0.20,
        n_steps: int = 252,
        dt: float = 1 / 252,
    ) -> dict[str, Any]:
        """Generate a single named scenario price path.

        Args:
            scenario_name: Name of the scenario (must be in
                :attr:`custom_scenarios`).
            s0: Initial price.
            base_mu: Base annual drift.
            base_sigma: Base annual volatility.
            n_steps: Number of time steps.
            dt: Step size in years.

        Returns:
            Dict with keys ``scenario``, ``prices`` (list), ``returns`` (list),
            ``final_price``, ``total_return``, ``description``.

        Raises:
            KeyError: If *scenario_name* is not registered.
        """
        if scenario_name not in self.custom_scenarios:
            raise KeyError(
                f"Unknown scenario '{scenario_name}'. "
                f"Available: {list(self.custom_scenarios)}"
            )

        sc = self.custom_scenarios[scenario_name]
        adj_mu = base_mu * sc.drift_multiplier
        adj_sigma = base_sigma * sc.volatility_multiplier

        prices = self.simulator.simulate(
            s0=s0, mu=adj_mu, sigma=adj_sigma, n_steps=n_steps, dt=dt
        )

        # Apply the one-time gap move, if configured, from shock_step onward.
        if sc.shock != 0.0 and sc.shock_step is not None:
            step = min(sc.shock_step, n_steps)
            prices[step:] *= np.exp(sc.shock)

        returns = list(np.diff(prices) / prices[:-1])
        total_return = float((prices[-1] / prices[0]) - 1.0)

        logger.debug(
            f"Scenario '{scenario_name}': total_return={total_return:.2%}, "
            f"final_price={prices[-1]:.2f}"
        )
        return {
            "scenario": scenario_name,
            "prices": prices.tolist(),
            "returns": returns,
            "final_price": float(prices[-1]),
            "total_return": total_return,
            "description": sc.description,
        }

    def generate_all(
        self,
        s0: float = 100.0,
        base_mu: float = 0.05,
        base_sigma: float = 0.20,
        n_steps: int = 252,
        dt: float = 1 / 252,
    ) -> dict[str, Any]:
        """Generate all registered scenarios.

        Args:
            s0: Initial price.
            base_mu: Base annual drift.
            base_sigma: Base annual volatility.
            n_steps: Number of steps.
            dt: Step size in years (FIX: previously not forwarded, so
                scenarios could not share a non-default time grid).

        Returns:
            Dict mapping scenario names to their result dicts.
        """
        return {
            name: self.generate(name, s0, base_mu, base_sigma, n_steps, dt)
            for name in self.custom_scenarios
        }

    def list_scenarios(self) -> list[dict[str, str]]:
        """List all available scenario names and descriptions.

        Returns:
            List of dicts with ``name`` and ``description`` keys.
        """
        return [
            {"name": sc.name, "description": sc.description}
            for sc in self.custom_scenarios.values()
        ]
class SyntheticDataForge:
    """Augment financial time series to create additional training samples.

    Implements four augmentation primitives:

    * **Noise injection** - add Gaussian noise scaled to series volatility.
    * **Time warping** - non-uniform time axis compression / expansion.
    * **Window slicing** - extract random sub-windows and rescale.
    * **Magnitude scaling** - globally scale the series by a random factor.

    Attributes:
        seed: Random seed for reproducibility.
        noise_scale: Fraction of series std-dev used for noise injection.
        warp_knots: Number of interpolation knots for time warping.
        scale_range: ``(min_factor, max_factor)`` for magnitude scaling.
    """

    def __init__(
        self,
        seed: int | None = None,
        noise_scale: float = 0.05,
        warp_knots: int = 4,
        scale_range: tuple[float, float] = (0.8, 1.2),
    ) -> None:
        """Initialise SyntheticDataForge.

        Args:
            seed: NumPy random seed.
            noise_scale: Noise amplitude as a multiple of the series std-dev.
            warp_knots: Number of internal knot points for time warping.
            scale_range: Min and max scaling factors for magnitude scaling.
        """
        # FIX: ``seed`` is documented as a public attribute but was never
        # stored; keep it for reproducibility audits.
        self.seed = seed
        self.noise_scale = noise_scale
        self.warp_knots = warp_knots
        self.scale_range = scale_range
        self._rng = np.random.default_rng(seed)

    # ------------------------------------------------------------------
    # Augmentation primitives
    # ------------------------------------------------------------------

    def inject_noise(self, series: Any) -> np.ndarray:
        """Add Gaussian noise to a price series.

        Args:
            series: 1-D array-like of price values.

        Returns:
            Augmented series with noise added (same length as input).
        """
        arr = np.asarray(series, dtype=np.float64)
        # Fall back to unit std for degenerate (length <= 1) inputs.
        std = float(np.std(arr)) if len(arr) > 1 else 1.0
        noise = self._rng.normal(0, self.noise_scale * std, size=arr.shape)
        return arr + noise

    def time_warp(self, series: Any) -> np.ndarray:
        """Apply non-uniform time axis compression / expansion.

        Generates a smooth random warp function using piecewise linear
        interpolation, then resamples the original series.

        Args:
            series: 1-D array-like price series.

        Returns:
            Time-warped series of the same length (endpoints preserved).
        """
        arr = np.asarray(series, dtype=np.float64)
        n = len(arr)
        if n < 4:
            return arr.copy()

        # Random warp magnitudes at knot points; endpoints pinned so the
        # warped series starts and ends where the original does.
        knot_x = np.linspace(0, n - 1, self.warp_knots + 2)
        knot_y = knot_x + self._rng.uniform(-n * 0.1, n * 0.1, size=len(knot_x))
        knot_y[0] = 0.0
        knot_y[-1] = n - 1
        knot_y = np.clip(knot_y, 0, n - 1)
        knot_y = np.sort(knot_y)

        # Interpolate the warp function at all integer indices, then resample.
        warp_indices = np.interp(np.arange(n), knot_x, knot_y)
        return np.interp(warp_indices, np.arange(n), arr)

    def window_slice(self, series: Any, window_fraction: float = 0.9) -> np.ndarray:
        """Extract a random sub-window and rescale back to original length.

        Args:
            series: 1-D array-like price series.
            window_fraction: Fraction of the series to include in the slice
                (0 < f < 1).

        Returns:
            Sliced and resampled series of the original length.

        Raises:
            ValueError: If window_fraction is outside (0, 1).
        """
        if not 0 < window_fraction < 1:
            raise ValueError("window_fraction must be in (0, 1).")
        arr = np.asarray(series, dtype=np.float64)
        n = len(arr)
        window_size = max(2, int(n * window_fraction))
        start = int(self._rng.integers(0, n - window_size + 1))
        sliced = arr[start: start + window_size]
        return np.interp(
            np.linspace(0, len(sliced) - 1, n), np.arange(len(sliced)), sliced
        )

    def magnitude_scale(self, series: Any) -> np.ndarray:
        """Globally scale a series by a random factor drawn from scale_range.

        Args:
            series: 1-D array-like price series.

        Returns:
            Scaled series.
        """
        arr = np.asarray(series, dtype=np.float64)
        factor = self._rng.uniform(*self.scale_range)
        return arr * factor

    # ------------------------------------------------------------------
    # High-level augmentation
    # ------------------------------------------------------------------

    def augment(
        self,
        series: Any,
        n_samples: int = 10,
        methods: list[str] | None = None,
    ) -> list[np.ndarray]:
        """Generate multiple augmented versions of a series.

        Each sample applies a random non-empty subset of the chosen methods.

        Args:
            series: Base price series.
            n_samples: Number of augmented samples to generate.
            methods: List of method names to draw from per sample.
                Defaults to all four methods.

        Returns:
            List of *n_samples* augmented NumPy arrays.

        Raises:
            ValueError: If an unknown method name is provided.
        """
        try:
            from loguru import logger
        except ImportError:  # pragma: no cover - stdlib fallback for isolated use
            import logging
            logger = logging.getLogger(__name__)

        available = {
            "noise": self.inject_noise,
            "warp": self.time_warp,
            "slice": self.window_slice,
            "scale": self.magnitude_scale,
        }
        chosen = methods or list(available.keys())
        for m in chosen:
            if m not in available:
                raise ValueError(
                    f"Unknown augmentation method '{m}'. Options: {list(available)}"
                )

        arr = np.asarray(series, dtype=np.float64)
        samples: list[np.ndarray] = []
        for _ in range(n_samples):
            augmented = arr.copy()
            # Randomly apply a random subset of the chosen methods.
            k = int(self._rng.integers(1, len(chosen) + 1))
            selected = self._rng.choice(chosen, size=k, replace=False)
            for method_name in selected:
                augmented = available[method_name](augmented)
            samples.append(augmented)

        logger.debug(f"Augmented {n_samples} samples using methods: {chosen}")
        return samples
@dataclass
class Agent:
    """A single market participant in the simulated order flow.

    Attributes:
        agent_id: Unique agent identifier.
        cash: Current cash balance.
        inventory: Current position (shares held).
        agent_type: ``"market_maker"``, ``"trend_follower"``, or
            ``"noise_trader"``.
        params: Strategy-specific tuning parameters.
    """

    agent_id: str
    cash: float
    inventory: float
    agent_type: str
    params: dict[str, Any] = field(default_factory=dict)


class AgentSimulation:
    """Simulate price discovery through heterogeneous interacting agents.

    Market makers quote around the mid-price and lean against their
    inventory, trend followers trade recent momentum, and noise traders
    submit random orders for realistic microstructure noise.  Each step
    aggregates the executed agents' price impact into a new mid-price.

    Attributes:
        tick_size: Minimum price increment.
        initial_price: Starting mid-price.
    """

    def __init__(
        self,
        n_market_makers: int = 3,
        n_trend_followers: int = 10,
        n_noise_traders: int = 20,
        tick_size: float = 0.01,
        initial_price: float = 100.0,
        seed: int | None = None,
    ) -> None:
        """Create the agent population and seed the price history.

        Args:
            n_market_makers: Market maker count.
            n_trend_followers: Trend follower count.
            n_noise_traders: Noise trader count.
            tick_size: Minimum price step.
            initial_price: Initial equilibrium price.
            seed: NumPy random seed.
        """
        self.tick_size = tick_size
        self.initial_price = initial_price
        self._rng = np.random.default_rng(seed)
        self._agents: list[Agent] = []
        self._price_history: list[float] = [initial_price]
        self._volume_history: list[float] = [0.0]

        for idx in range(n_market_makers):
            self._agents.append(Agent(
                f"mm_{idx}", cash=500_000.0, inventory=0.0,
                agent_type="market_maker",
                params={"spread_fraction": 0.002, "max_inventory": 1000.0},
            ))
        for idx in range(n_trend_followers):
            lookback = int(self._rng.integers(5, 30))
            strength = float(self._rng.uniform(0.5, 2.0))
            self._agents.append(Agent(
                f"tf_{idx}", cash=200_000.0, inventory=0.0,
                agent_type="trend_follower",
                params={"lookback": lookback, "strength": strength},
            ))
        for idx in range(n_noise_traders):
            self._agents.append(Agent(
                f"nt_{idx}", cash=100_000.0, inventory=0.0,
                agent_type="noise_trader",
                params={"order_std": 10.0},
            ))

    # ------------------------------------------------------------------
    # Order-generation helpers (one per agent type)
    # ------------------------------------------------------------------

    def _market_maker_order(
        self, agent: Agent, mid_price: float
    ) -> tuple[float, float]:
        """Quote around *mid_price*, skewing orders to flatten inventory.

        Args:
            agent: Market maker agent.
            mid_price: Current mid-price.

        Returns:
            ``(signed_order_size, price_impact)`` tuple.
        """
        spread = mid_price * agent.params["spread_fraction"]
        skew = -agent.inventory / (agent.params["max_inventory"] + 1e-9)
        desired = skew * spread
        qty = float(self._rng.normal(desired, 5.0))
        return qty, float(spread * 0.1 * np.sign(qty))

    def _trend_follower_order(
        self, agent: Agent, price_history: list[float]
    ) -> tuple[float, float]:
        """Trade in the direction of recent price momentum.

        Args:
            agent: Trend follower agent.
            price_history: Full price history.

        Returns:
            ``(signed_order_size, price_impact)``; zero until enough history.
        """
        window = agent.params["lookback"]
        if len(price_history) < window + 1:
            return 0.0, 0.0

        tail = price_history[-window:]
        momentum = (tail[-1] - tail[0]) / (tail[0] + 1e-9)
        qty = momentum * agent.params["strength"] * 100.0
        return float(qty), float(abs(qty) * 0.0001 * np.sign(qty))

    def _noise_trader_order(self, agent: Agent) -> tuple[float, float]:
        """Submit a random order to add microstructure noise.

        Args:
            agent: Noise trader agent.

        Returns:
            ``(signed_order_size, price_impact)`` tuple.
        """
        qty = float(self._rng.normal(0, agent.params["order_std"]))
        return qty, float(abs(qty) * 0.00005 * np.sign(qty))

    # ------------------------------------------------------------------
    # Public interface
    # ------------------------------------------------------------------

    def run(self, n_steps: int = 252) -> dict[str, Any]:
        """Run the multi-agent market simulation.

        Args:
            n_steps: Number of simulation steps (e.g., trading days).

        Returns:
            Dict with keys ``prices`` (list), ``volumes`` (list),
            ``agent_pnl`` (dict of agent_id -> float), and
            ``market_stats`` (summary statistics dict).
        """
        logger.info(
            f"Starting agent simulation: {len(self._agents)} agents, {n_steps} steps"
        )
        prices = self._price_history.copy()
        volumes = self._volume_history.copy()

        for _ in range(n_steps):
            mid_px = prices[-1]
            impact_sum = 0.0
            volume_sum = 0.0

            for agent in self._agents:
                if agent.agent_type == "trend_follower":
                    qty, px_impact = self._trend_follower_order(agent, prices)
                elif agent.agent_type == "market_maker":
                    qty, px_impact = self._market_maker_order(agent, mid_px)
                else:
                    qty, px_impact = self._noise_trader_order(agent)

                fill_px = max(self.tick_size, mid_px + px_impact)
                notional = abs(qty) * fill_px

                # Sells are always allowed; buys require sufficient cash.
                if qty < 0 or agent.cash >= notional:
                    agent.inventory += qty
                    agent.cash -= qty * fill_px
                    impact_sum += px_impact * abs(qty) / (abs(qty) + 1e-9)
                    volume_sum += abs(qty)

            # Next mid = current mid + scaled aggregate impact + noise.
            micro_noise = float(self._rng.normal(0, mid_px * 0.001))
            next_px = max(self.tick_size, mid_px + impact_sum * 0.01 + micro_noise)
            prices.append(round(next_px, 4))
            volumes.append(round(volume_sum, 2))

        # Mark all agents to the final price against their starting capital.
        final_price = prices[-1]
        starting_cash = {
            "market_maker": 500_000.0,
            "trend_follower": 200_000.0,
            "noise_trader": 100_000.0,
        }
        agent_pnl = {
            a.agent_id: round(
                a.cash + a.inventory * final_price - starting_cash[a.agent_type], 2
            )
            for a in self._agents
        }

        closes = np.array(prices[1:])
        step_returns = np.diff(closes) / closes[:-1]
        market_stats = {
            "final_price": final_price,
            "total_return": float((prices[-1] / prices[0]) - 1.0),
            "volatility": float(np.std(step_returns, ddof=1)) * np.sqrt(252) if len(step_returns) > 1 else 0.0,
            "avg_daily_volume": float(np.mean(volumes[1:])),
            "n_agents": len(self._agents),
        }

        logger.info(
            f"Simulation complete: final_price={final_price:.2f}, "
            f"vol={market_stats['volatility']:.2%}"
        )
        return {
            "prices": prices,
            "volumes": volumes,
            "agent_pnl": agent_pnl,
            "market_stats": market_stats,
        }
class BacktestingEngine:
    """Back-test a trading strategy against historical price data.

    Supports vectorised strategies (functions that map a price array to a
    signal array).  Computes Sharpe, Sortino, max drawdown, Calmar ratio,
    win rate, and profit factor.

    Attributes:
        initial_capital: Starting portfolio value in currency units.
        commission_bps: Round-trip transaction cost in basis points.
        annualisation_factor: Trading periods per year.
        risk_free_rate: Annual risk-free rate for Sharpe/Sortino calculation.
    """

    def __init__(
        self,
        initial_capital: float = 100_000.0,
        commission_bps: float = 2.0,
        annualisation_factor: int = 252,
        risk_free_rate: float = 0.02,
    ) -> None:
        """Initialise BacktestingEngine.

        Args:
            initial_capital: Starting capital.
            commission_bps: Round-trip commission in basis points.
            annualisation_factor: Periods per year for annualisation.
            risk_free_rate: Annual risk-free rate.
        """
        self.initial_capital = initial_capital
        self.commission_bps = commission_bps
        self.annualisation_factor = annualisation_factor
        self.risk_free_rate = risk_free_rate

    # ------------------------------------------------------------------
    # Private helpers
    # ------------------------------------------------------------------

    def _compute_metrics(
        self, returns: np.ndarray, equity_curve: np.ndarray
    ) -> dict[str, float]:
        """Compute strategy performance metrics.

        Args:
            returns: Period return array (net of costs).
            equity_curve: Cumulative portfolio value array.

        Returns:
            Metrics dict: total/annualised return, annualised volatility,
            Sharpe, Sortino, max drawdown, Calmar, win rate, profit factor.
        """
        ann_factor = self.annualisation_factor
        rf_period = self.risk_free_rate / ann_factor

        ann_return = float(np.mean(returns)) * ann_factor
        ann_vol = float(np.std(returns, ddof=1)) * np.sqrt(ann_factor) if len(returns) > 1 else 0.0
        sharpe = (ann_return - self.risk_free_rate) / ann_vol if ann_vol > 0 else 0.0

        # Sortino penalises only deviation below the per-period risk-free
        # hurdle.
        downside = returns[returns < rf_period] - rf_period
        downside_dev = float(np.std(downside, ddof=1)) * np.sqrt(ann_factor) if len(downside) > 1 else 0.0
        sortino = (ann_return - self.risk_free_rate) / downside_dev if downside_dev > 0 else 0.0

        peak = np.maximum.accumulate(equity_curve)
        dd = (equity_curve - peak) / (peak + 1e-9)
        max_dd = float(np.min(dd))
        calmar = ann_return / abs(max_dd) if max_dd != 0 else 0.0

        winning_trades = returns[returns > 0]
        losing_trades = returns[returns < 0]
        win_rate = len(winning_trades) / len(returns) if len(returns) > 0 else 0.0
        # With no losing periods the profit factor is conventionally infinite.
        profit_factor = (
            float(np.sum(winning_trades)) / abs(float(np.sum(losing_trades)))
            if len(losing_trades) > 0 and np.sum(losing_trades) != 0
            else float("inf")
        )

        total_return = float((equity_curve[-1] / equity_curve[0]) - 1.0) if len(equity_curve) > 1 else 0.0

        return {
            "total_return": total_return,
            "annualised_return": ann_return,
            "annualised_volatility": ann_vol,
            "sharpe_ratio": sharpe,
            "sortino_ratio": sortino,
            "max_drawdown": max_dd,
            "calmar_ratio": calmar,
            "win_rate": win_rate,
            "profit_factor": profit_factor,
        }

    # ------------------------------------------------------------------
    # Public interface
    # ------------------------------------------------------------------

    def run_vectorised(
        self,
        prices: Any,
        signal_fn: Callable[[np.ndarray], np.ndarray],
    ) -> dict[str, Any]:
        """Run a vectorised back-test.

        The strategy is encoded as a function that maps a price array to a
        signal array where +1 = long, -1 = short, 0 = flat.

        Args:
            prices: Array-like of close prices.
            signal_fn: Callable that takes a 1-D price array and returns a
                same-length signal array with values in {-1, 0, 1}.

        Returns:
            Dict with keys ``equity_curve`` (list), ``returns`` (list),
            ``metrics`` (dict), ``trades`` (int).

        Raises:
            ValueError: If the price array is too short or the signal array
                has the wrong length.
        """
        try:
            from loguru import logger
        except ImportError:  # pragma: no cover - stdlib fallback for isolated use
            import logging
            logger = logging.getLogger(__name__)

        price_arr = np.asarray(prices, dtype=np.float64)
        if len(price_arr) < 2:
            raise ValueError("prices must have at least 2 elements.")

        signals = np.asarray(signal_fn(price_arr), dtype=np.float64)
        if len(signals) != len(price_arr):
            raise ValueError("signal_fn must return array same length as prices.")

        # Signal at t is applied to the t -> t+1 price change.
        price_returns = np.diff(price_arr) / price_arr[:-1]
        strategy_returns = signals[:-1] * price_returns

        # Commission charged whenever the position changes.
        position_changes = np.diff(np.concatenate([[0], signals[:-1]]))
        commission = np.abs(position_changes) * (self.commission_bps / 10_000)
        net_returns = strategy_returns - commission

        # Equity curve via cumulative product (vectorised; replaces the
        # previous per-period Python loop).
        growth = np.concatenate([[1.0], 1.0 + net_returns])
        equity = self.initial_capital * np.cumprod(growth)

        n_trades = int(np.sum(np.abs(position_changes) > 0))
        metrics = self._compute_metrics(net_returns, equity)

        logger.info(
            f"Backtest complete: {n_trades} trades, "
            f"Sharpe={metrics['sharpe_ratio']:.2f}, "
            f"MaxDD={metrics['max_drawdown']:.2%}"
        )
        return {
            "equity_curve": equity.tolist(),
            "returns": net_returns.tolist(),
            "metrics": metrics,
            "trades": n_trades,
        }

    def run_buy_and_hold(self, prices: Any) -> dict[str, Any]:
        """Run a buy-and-hold benchmark (always long one unit).

        Args:
            prices: Array-like of close prices.

        Returns:
            Same structure as :meth:`run_vectorised`.
        """
        return self.run_vectorised(prices, lambda p: np.ones(len(p)))
class MonteCarlo:
    """Run Monte Carlo simulations for probabilistic financial modelling.

    Supports multiple return distributions (normal, Student-t, uniform)
    and provides percentile-based risk metrics over the simulated ensemble.

    Attributes:
        n_simulations: Number of simulation paths.
        seed: Random seed.
        distribution: Return distribution (``"normal"``, ``"t"``, or
            ``"uniform"``).
        t_df: Degrees of freedom for the Student-t distribution.
    """

    def __init__(
        self,
        n_simulations: int = 10_000,
        seed: int | None = None,
        distribution: str = "normal",
        t_df: float = 5.0,
    ) -> None:
        """Initialise MonteCarlo.

        Args:
            n_simulations: Number of Monte Carlo paths.
            seed: Random seed for reproducibility.
            distribution: Sampling distribution for returns.
            t_df: Degrees of freedom for Student-t (only used when
                distribution = ``"t"``).

        Raises:
            ValueError: If distribution is not supported.
        """
        supported = ("normal", "t", "uniform")
        if distribution not in supported:
            raise ValueError(f"distribution must be one of {supported}.")
        self.n_simulations = n_simulations
        self.seed = seed
        self.distribution = distribution
        self.t_df = t_df
        self._rng = np.random.default_rng(seed)

    # ------------------------------------------------------------------
    # Private helpers
    # ------------------------------------------------------------------

    def _sample_returns(self, mu: float, sigma: float, n_steps: int) -> np.ndarray:
        """Sample a return matrix from the configured distribution.

        Args:
            mu: Per-step mean return.
            sigma: Per-step standard deviation.
            n_steps: Number of steps per path.

        Returns:
            Return matrix of shape ``(n_simulations, n_steps)``.
        """
        shape = (self.n_simulations, n_steps)
        if self.distribution == "normal":
            return self._rng.normal(mu, sigma, shape)
        if self.distribution == "t":
            # Rescale raw t-draws to unit variance before applying sigma.
            raw = self._rng.standard_t(self.t_df, shape)
            raw_std = np.sqrt(self.t_df / (self.t_df - 2)) if self.t_df > 2 else 1.0
            return mu + sigma * raw / raw_std
        # Uniform with the requested mean and standard deviation.
        half = sigma * np.sqrt(3)
        return self._rng.uniform(mu - half, mu + half, shape)

    # ------------------------------------------------------------------
    # Public interface
    # ------------------------------------------------------------------

    def simulate_paths(
        self,
        s0: float,
        mu: float,
        sigma: float,
        n_steps: int,
        dt: float = 1 / 252,
    ) -> np.ndarray:
        """Simulate price paths using log-normal evolution.

        Args:
            s0: Initial price.
            mu: Annual drift.
            sigma: Annual volatility.
            n_steps: Number of time steps.
            dt: Step size in years.

        Returns:
            Price matrix of shape ``(n_simulations, n_steps + 1)`` whose
            first column equals ``s0`` exactly.
        """
        step_mu = (mu - 0.5 * sigma ** 2) * dt
        step_sigma = sigma * np.sqrt(dt)
        log_returns = self._sample_returns(step_mu, step_sigma, n_steps)

        # BUG FIX: the previous implementation concatenated a log(s0) column
        # with the *bare* cumulative returns, so every path collapsed from
        # s0 to ~exp(cum return) at step 1.  Anchor all columns at s0.
        prices = np.empty((self.n_simulations, n_steps + 1))
        prices[:, 0] = s0
        prices[:, 1:] = s0 * np.exp(np.cumsum(log_returns, axis=1))
        return prices

    def terminal_distribution(
        self,
        s0: float,
        mu: float,
        sigma: float,
        n_steps: int,
        dt: float = 1 / 252,
    ) -> dict[str, Any]:
        """Compute statistics of the terminal price distribution.

        Args:
            s0: Initial price.
            mu: Annual drift.
            sigma: Annual volatility.
            n_steps: Number of steps to horizon.
            dt: Step size in years.

        Returns:
            Dict with percentile prices, mean, std, skewness, kurtosis,
            VaR at 95%, and probability of loss.
        """
        try:
            from loguru import logger
        except ImportError:  # pragma: no cover - stdlib fallback for isolated use
            import logging
            logger = logging.getLogger(__name__)

        paths = self.simulate_paths(s0, mu, sigma, n_steps, dt)
        terminals = paths[:, -1]

        returns = (terminals - s0) / s0
        var_95 = float(np.percentile(returns, 5))

        logger.debug(
            f"Monte Carlo terminal distribution: mean={float(np.mean(terminals)):.2f}, "
            f"std={float(np.std(terminals)):.2f}"
        )
        return {
            "mean_price": float(np.mean(terminals)),
            "std_price": float(np.std(terminals)),
            "median_price": float(np.median(terminals)),
            "p5_price": float(np.percentile(terminals, 5)),
            "p25_price": float(np.percentile(terminals, 25)),
            "p75_price": float(np.percentile(terminals, 75)),
            "p95_price": float(np.percentile(terminals, 95)),
            "skewness": float(stats.skew(terminals)),
            "kurtosis": float(stats.kurtosis(terminals)),
            "var_95_return": var_95,
            "prob_loss": float(np.mean(terminals < s0)),
            "n_simulations": self.n_simulations,
        }

    def estimate_var(
        self,
        portfolio_value: float,
        mu: float,
        sigma: float,
        horizon_days: int = 1,
        confidence_level: float = 0.95,
    ) -> dict[str, float]:
        """Estimate portfolio Value-at-Risk via Monte Carlo.

        Args:
            portfolio_value: Current portfolio value.
            mu: Daily expected return.
            sigma: Daily volatility.
            horizon_days: Risk horizon in days.
            confidence_level: Confidence level (e.g., 0.95).

        Returns:
            Dict with ``var_amount``, ``var_pct``, ``cvar_amount``,
            ``cvar_pct``.
        """
        # dt=1.0 because mu/sigma are already per-day quantities.
        paths = self.simulate_paths(portfolio_value, mu, sigma, horizon_days, dt=1.0)
        terminals = paths[:, -1]
        returns = (terminals - portfolio_value) / portfolio_value

        cutoff_pct = (1 - confidence_level) * 100
        var_pct = float(-np.percentile(returns, cutoff_pct))
        # CVaR (expected shortfall) averages the losses beyond the VaR cut.
        tail_returns = returns[returns <= -var_pct]
        cvar_pct = float(-np.mean(tail_returns)) if len(tail_returns) > 0 else var_pct

        return {
            "var_amount": round(portfolio_value * var_pct, 2),
            "var_pct": round(var_pct, 6),
            "cvar_amount": round(portfolio_value * cvar_pct, 2),
            "cvar_pct": round(cvar_pct, 6),
        }
b/synthetic-ai/validation/distribution_matcher.py @@ -0,0 +1,193 @@ +"""Distribution matching: statistical distribution validation using moments. + +Provides :class:`DistributionMatcher` for comparing empirical moments and +fitting parametric distributions to financial return data. +""" + +from __future__ import annotations + +from typing import Any + +import numpy as np +from scipy import stats +from loguru import logger + + +class DistributionMatcher: + """Validate and match statistical distributions for financial returns. + + Computes the first four statistical moments, fits candidate parametric + distributions, and selects the best fit by AIC criterion. + + Attributes: + candidate_distributions: Distributions to consider for fitting. + moment_tolerances: Acceptable relative error for each moment. + """ + + _DEFAULT_CANDIDATES: list[str] = ["norm", "t", "laplace", "logistic", "gennorm"] + + def __init__( + self, + candidate_distributions: list[str] | None = None, + moment_tolerances: dict[str, float] | None = None, + ) -> None: + """Initialise DistributionMatcher. + + Args: + candidate_distributions: List of scipy.stats distribution names + to consider. + moment_tolerances: Dict mapping moment names (``"mean"``, ``"std"``, + ``"skewness"``, ``"kurtosis"``) to acceptable relative errors. + """ + self.candidate_distributions = ( + candidate_distributions or self._DEFAULT_CANDIDATES + ) + self.moment_tolerances = moment_tolerances or { + "mean": 0.5, + "std": 0.2, + "skewness": 0.5, + "kurtosis": 1.0, + } + + # ------------------------------------------------------------------ + # Private helpers + # ------------------------------------------------------------------ + + @staticmethod + def _compute_moments(data: np.ndarray) -> dict[str, float]: + """Compute the first four standardised moments. + + Args: + data: 1-D array of observations. + + Returns: + Dict with ``mean``, ``std``, ``skewness``, ``kurtosis`` (excess). 
+ """ + return { + "mean": float(np.mean(data)), + "std": float(np.std(data, ddof=1)), + "skewness": float(stats.skew(data)), + "kurtosis": float(stats.kurtosis(data)), + } + + def _fit_distribution( + self, dist_name: str, data: np.ndarray + ) -> dict[str, Any] | None: + """Fit a parametric distribution and compute AIC. + + Args: + dist_name: scipy.stats distribution name. + data: Sample data array. + + Returns: + Dict with ``distribution``, ``params``, ``aic``, or None on + failure. + """ + try: + dist = getattr(stats, dist_name) + params = dist.fit(data) + log_lik = np.sum(dist.logpdf(data, *params)) + k = len(params) + aic = 2 * k - 2 * float(log_lik) + return {"distribution": dist_name, "params": params, "aic": aic} + except Exception as exc: + logger.debug(f"Failed to fit {dist_name}: {exc}") + return None + + # ------------------------------------------------------------------ + # Public interface + # ------------------------------------------------------------------ + + def compute_moments(self, data: Any) -> dict[str, float]: + """Compute descriptive statistics and moments of a data series. + + Args: + data: Array-like of numeric values. + + Returns: + Moments dict: ``mean``, ``std``, ``skewness``, ``kurtosis``. + + Raises: + ValueError: If fewer than 4 data points are provided. + """ + arr = np.asarray(data, dtype=np.float64).ravel() + if len(arr) < 4: + raise ValueError("At least 4 data points are required.") + return self._compute_moments(arr) + + def fit_best_distribution( + self, data: Any + ) -> dict[str, Any]: + """Fit candidate distributions and return the best by AIC. + + Args: + data: Array-like of return observations. + + Returns: + Dict with keys ``best_distribution``, ``best_aic``, ``best_params``, + and ``all_fits`` (list of all candidate results). 
+ """ + arr = np.asarray(data, dtype=np.float64).ravel() + if len(arr) < 10: + raise ValueError("At least 10 data points are required for distribution fitting.") + + fits = [] + for dist_name in self.candidate_distributions: + result = self._fit_distribution(dist_name, arr) + if result is not None: + fits.append(result) + + if not fits: + raise RuntimeError("No distributions could be fitted to the data.") + + best = min(fits, key=lambda x: x["aic"]) + logger.debug( + f"Best distribution: {best['distribution']}, AIC={best['aic']:.2f}" + ) + return { + "best_distribution": best["distribution"], + "best_aic": round(best["aic"], 4), + "best_params": best["params"], + "all_fits": [ + {"distribution": f["distribution"], "aic": round(f["aic"], 4)} + for f in sorted(fits, key=lambda x: x["aic"]) + ], + } + + def compare_moments( + self, + real_data: Any, + synthetic_data: Any, + ) -> dict[str, Any]: + """Compare moments between real and synthetic datasets. + + Args: + real_data: Reference data array. + synthetic_data: Synthetic data array to validate. + + Returns: + Dict with per-moment comparisons and a ``passed`` flag. 
+ """ + real_arr = np.asarray(real_data, dtype=np.float64).ravel() + synth_arr = np.asarray(synthetic_data, dtype=np.float64).ravel() + + real_m = self._compute_moments(real_arr) + synth_m = self._compute_moments(synth_arr) + + comparisons: dict[str, Any] = {} + for moment_name in ("mean", "std", "skewness", "kurtosis"): + rv = real_m[moment_name] + sv = synth_m[moment_name] + tol = self.moment_tolerances.get(moment_name, 0.5) + rel_err = abs(rv - sv) / (abs(rv) + 1e-9) + comparisons[moment_name] = { + "real": round(rv, 6), + "synthetic": round(sv, 6), + "relative_error": round(rel_err, 6), + "tolerance": tol, + "passed": rel_err <= tol, + } + + overall = all(v["passed"] for v in comparisons.values()) + logger.debug(f"Moment comparison: overall_passed={overall}") + return {"passed": overall, "moments": comparisons} diff --git a/synthetic-ai/validation/reality_checker.py b/synthetic-ai/validation/reality_checker.py new file mode 100644 index 0000000..08bb876 --- /dev/null +++ b/synthetic-ai/validation/reality_checker.py @@ -0,0 +1,171 @@ +"""Reality checking: validate synthetic data against real data distributions. + +Provides :class:`RealityChecker` using Kolmogorov-Smirnov tests, correlation +checks, and autocorrelation comparisons. +""" + +from __future__ import annotations + +from typing import Any + +import numpy as np +from scipy import stats +from loguru import logger + + +class RealityChecker: + """Validate synthetic financial time series against real data. + + Runs a battery of statistical tests to ensure that synthetic data + plausibly replicates the key statistical properties of real market data. + + Tests performed: + + * **KS test** on return distributions. + * **Mean / std comparison** (z-test on means). + * **Autocorrelation** check (first-order lag-1 ACF). + * **Tail ratio** (95th percentile / 5th percentile returns). + * **Variance ratio** test for random-walk properties. + + Attributes: + ks_alpha: Significance level for KS test. 
+ mean_tol: Tolerance for mean comparison (absolute difference). + std_tol: Tolerance for std comparison (relative difference). + """ + + def __init__( + self, + ks_alpha: float = 0.05, + mean_tol: float = 0.002, + std_tol: float = 0.20, + ) -> None: + """Initialise RealityChecker. + + Args: + ks_alpha: KS test significance level. + mean_tol: Absolute tolerance for mean return comparison. + std_tol: Relative tolerance for std comparison. + """ + self.ks_alpha = ks_alpha + self.mean_tol = mean_tol + self.std_tol = std_tol + + # ------------------------------------------------------------------ + # Private helpers + # ------------------------------------------------------------------ + + @staticmethod + def _price_to_returns(prices: Any) -> np.ndarray: + """Convert prices to log-returns. + + Args: + prices: Array-like of prices. + + Returns: + Log-return array. + """ + arr = np.asarray(prices, dtype=np.float64) + return np.diff(np.log(arr)) + + @staticmethod + def _acf_lag1(returns: np.ndarray) -> float: + """Compute lag-1 autocorrelation. + + Args: + returns: Return array. + + Returns: + Lag-1 Pearson correlation coefficient. + """ + if len(returns) < 3: + return 0.0 + return float(np.corrcoef(returns[:-1], returns[1:])[0, 1]) + + # ------------------------------------------------------------------ + # Public interface + # ------------------------------------------------------------------ + + def check( + self, + real_prices: Any, + synthetic_prices: Any, + ) -> dict[str, Any]: + """Run full reality-check battery. + + Args: + real_prices: Array-like of real market prices. + synthetic_prices: Array-like of synthetic prices. + + Returns: + Dict with test names as keys and result dicts as values, plus an + overall ``passed`` flag. + + Raises: + ValueError: If either price series has fewer than 10 data points. 
+ """ + real_r = self._price_to_returns(real_prices) + synth_r = self._price_to_returns(synthetic_prices) + + for name, arr in [("real", real_r), ("synthetic", synth_r)]: + if len(arr) < 10: + raise ValueError(f"{name} prices must yield at least 10 returns.") + + results: dict[str, Any] = {} + + # 1. KS test + ks_stat, ks_pvalue = stats.ks_2samp(real_r, synth_r) + results["ks_test"] = { + "statistic": round(float(ks_stat), 6), + "p_value": round(float(ks_pvalue), 6), + "passed": ks_pvalue >= self.ks_alpha, + } + + # 2. Mean comparison + real_mean = float(np.mean(real_r)) + synth_mean = float(np.mean(synth_r)) + mean_diff = abs(real_mean - synth_mean) + results["mean_comparison"] = { + "real_mean": round(real_mean, 6), + "synth_mean": round(synth_mean, 6), + "abs_diff": round(mean_diff, 6), + "passed": mean_diff <= self.mean_tol, + } + + # 3. Std comparison + real_std = float(np.std(real_r, ddof=1)) + synth_std = float(np.std(synth_r, ddof=1)) + rel_diff = abs(real_std - synth_std) / (real_std + 1e-9) + results["std_comparison"] = { + "real_std": round(real_std, 6), + "synth_std": round(synth_std, 6), + "relative_diff": round(rel_diff, 6), + "passed": rel_diff <= self.std_tol, + } + + # 4. Autocorrelation + real_acf = self._acf_lag1(real_r) + synth_acf = self._acf_lag1(synth_r) + acf_diff = abs(real_acf - synth_acf) + results["autocorrelation"] = { + "real_acf1": round(real_acf, 6), + "synth_acf1": round(synth_acf, 6), + "abs_diff": round(acf_diff, 6), + "passed": acf_diff < 0.1, + } + + # 5. 
Tail ratio + real_tail = float(np.percentile(real_r, 95)) / (abs(float(np.percentile(real_r, 5))) + 1e-9) + synth_tail = float(np.percentile(synth_r, 95)) / (abs(float(np.percentile(synth_r, 5))) + 1e-9) + tail_diff = abs(real_tail - synth_tail) + results["tail_ratio"] = { + "real_tail_ratio": round(real_tail, 4), + "synth_tail_ratio": round(synth_tail, 4), + "abs_diff": round(tail_diff, 4), + "passed": tail_diff < 0.5, + } + + overall = all(v["passed"] for v in results.values()) + n_passed = sum(1 for v in results.values() if v["passed"]) + logger.info(f"Reality check: {n_passed}/{len(results)} tests passed") + + return {"passed": overall, "tests": results, "n_passed": n_passed, "n_total": len(results)} diff --git a/vertical-ai/__init__.py b/vertical-ai/__init__.py new file mode 100644 index 0000000..b23a79c --- /dev/null +++ b/vertical-ai/__init__.py @@ -0,0 +1,115 @@ +"""Vertical AI – domain-specific trading intelligence module. + +This package exposes the :class:`VerticalAI` orchestrator which wires together +market analysis, risk management, order execution, and compliance sub-systems. 
+""" + +from __future__ import annotations + +import asyncio +from typing import Any + +from loguru import logger + +from vertical_ai.market_analysis.technical_analyzer import TechnicalAnalyzer +from vertical_ai.market_analysis.fundamental_analyzer import FundamentalAnalyzer +from vertical_ai.market_analysis.sentiment_analyzer import SentimentAnalyzer +from vertical_ai.market_analysis.orderbook_analyzer import OrderBookAnalyzer +from vertical_ai.risk_management.portfolio_risk import PortfolioRisk +from vertical_ai.risk_management.position_sizer import PositionSizer +from vertical_ai.risk_management.correlation_analyzer import CorrelationAnalyzer +from vertical_ai.execution.smart_order_router import SmartOrderRouter +from vertical_ai.execution.slippage_predictor import SlippagePredictor +from vertical_ai.execution.market_impact_model import MarketImpactModel +from vertical_ai.compliance.regulatory_checker import RegulatoryChecker +from vertical_ai.compliance.audit_logger import AuditLogger + + +class VerticalAI: + """Top-level orchestrator for the Vertical AI trading intelligence stack. + + Wires together all sub-systems and exposes a unified async interface for + market analysis, risk evaluation, order routing, and compliance checks. + + Attributes: + technical: Technical chart-pattern and indicator analyser. + fundamental: Financial-ratio analyser. + sentiment: News / social-media sentiment scorer. + orderbook: Market-depth and liquidity analyser. + portfolio_risk: VaR / CVaR / drawdown risk engine. + position_sizer: Kelly / fixed-fraction / vol-targeting sizer. + correlation: Rolling asset-correlation tracker. + router: Smart order router. + slippage: Slippage cost predictor. + market_impact: Square-root market-impact model. + compliance: Regulatory rule checker. + audit: Structured audit logger. + """ + + def __init__(self, config: dict[str, Any] | None = None) -> None: + """Initialise VerticalAI and all sub-systems. 
+ + Args: + config: Optional configuration overrides keyed by sub-system name. + """ + cfg = config or {} + logger.info("Initialising VerticalAI") + + self.technical = TechnicalAnalyzer(**cfg.get("technical", {})) + self.fundamental = FundamentalAnalyzer(**cfg.get("fundamental", {})) + self.sentiment = SentimentAnalyzer(**cfg.get("sentiment", {})) + self.orderbook = OrderBookAnalyzer(**cfg.get("orderbook", {})) + + self.portfolio_risk = PortfolioRisk(**cfg.get("portfolio_risk", {})) + self.position_sizer = PositionSizer(**cfg.get("position_sizer", {})) + self.correlation = CorrelationAnalyzer(**cfg.get("correlation", {})) + + self.router = SmartOrderRouter(**cfg.get("router", {})) + self.slippage = SlippagePredictor(**cfg.get("slippage", {})) + self.market_impact = MarketImpactModel(**cfg.get("market_impact", {})) + + self.compliance = RegulatoryChecker(**cfg.get("compliance", {})) + self.audit = AuditLogger(**cfg.get("audit", {})) + + logger.info("VerticalAI initialised successfully") + + async def full_analysis( + self, + ohlcv_data: dict[str, Any], + orderbook: dict[str, Any], + financial_data: dict[str, Any], + texts: list[str], + ) -> dict[str, Any]: + """Run all market-analysis components concurrently. + + Args: + ohlcv_data: OHLCV price data dict with keys ``open``, ``high``, + ``low``, ``close``, ``volume`` as array-like sequences. + orderbook: Order-book snapshot with ``bids`` and ``asks`` lists of + ``[price, size]`` pairs. + financial_data: Company financial metrics dict. + texts: List of news / social-media text strings to score. + + Returns: + Aggregated analysis results keyed by sub-system name. + + Raises: + ValueError: If any required data field is missing. 
+ """ + logger.info("Starting full market analysis") + technical_task = self.technical.analyze(ohlcv_data) + orderbook_task = self.orderbook.analyze(orderbook) + results = await asyncio.gather(technical_task, orderbook_task) + + fundamental_result = self.fundamental.analyze_fundamentals(financial_data) + sentiment_result = self.sentiment.analyze_sentiment(texts) + + return { + "technical": results[0], + "orderbook": results[1], + "fundamental": fundamental_result, + "sentiment": sentiment_result, + } + + +__all__ = ["VerticalAI"] diff --git a/vertical-ai/compliance/__init__.py b/vertical-ai/compliance/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/vertical-ai/compliance/__pycache__/__init__.cpython-312.pyc b/vertical-ai/compliance/__pycache__/__init__.cpython-312.pyc new file mode 100644 index 0000000..ce25196 Binary files /dev/null and b/vertical-ai/compliance/__pycache__/__init__.cpython-312.pyc differ diff --git a/vertical-ai/compliance/__pycache__/audit_logger.cpython-312.pyc b/vertical-ai/compliance/__pycache__/audit_logger.cpython-312.pyc new file mode 100644 index 0000000..74459fd Binary files /dev/null and b/vertical-ai/compliance/__pycache__/audit_logger.cpython-312.pyc differ diff --git a/vertical-ai/compliance/__pycache__/regulatory_checker.cpython-312.pyc b/vertical-ai/compliance/__pycache__/regulatory_checker.cpython-312.pyc new file mode 100644 index 0000000..3612925 Binary files /dev/null and b/vertical-ai/compliance/__pycache__/regulatory_checker.cpython-312.pyc differ diff --git a/vertical-ai/compliance/audit_logger.py b/vertical-ai/compliance/audit_logger.py new file mode 100644 index 0000000..bb9c6bf --- /dev/null +++ b/vertical-ai/compliance/audit_logger.py @@ -0,0 +1,231 @@ +"""Audit logging: structured event logging for all trading activity. + +Provides :class:`AuditLogger` which persists structured JSON log records for +orders, executions, risk events, and compliance decisions. 
+""" + +from __future__ import annotations + +import json +import os +from datetime import datetime, timezone +from pathlib import Path +from typing import Any + +from loguru import logger + + +class AuditLogger: + """Write structured audit records for trading events. + + Records are written to a line-delimited JSON (JSONL) file and also emitted + via :mod:`loguru` at the ``INFO`` level for real-time monitoring. + + Attributes: + log_dir: Directory where audit log files are stored. + log_file: Path of the active audit log file. + max_file_size_mb: File size at which rotation is triggered. + """ + + _VALID_EVENT_TYPES: frozenset[str] = frozenset( + [ + "order_submitted", + "order_filled", + "order_cancelled", + "order_rejected", + "risk_alert", + "compliance_check", + "position_update", + "pnl_snapshot", + "system_event", + ] + ) + + def __init__( + self, + log_dir: str = "logs/audit", + max_file_size_mb: float = 100.0, + ) -> None: + """Initialise AuditLogger. + + Args: + log_dir: Directory for audit log files (created if absent). + max_file_size_mb: Maximum log file size before rotation. + """ + self.log_dir = Path(log_dir) + self.log_dir.mkdir(parents=True, exist_ok=True) + self.max_file_size_bytes = int(max_file_size_mb * 1024 * 1024) + self._session_id = datetime.now(timezone.utc).strftime("%Y%m%dT%H%M%S") + self.log_file = self.log_dir / f"audit_{self._session_id}.jsonl" + self._record_count = 0 + + logger.info(f"AuditLogger initialised: {self.log_file}") + + # ------------------------------------------------------------------ + # Private helpers + # ------------------------------------------------------------------ + + def _should_rotate(self) -> bool: + """Check whether the current log file needs rotation. + + Returns: + True if the file exceeds :attr:`max_file_size_bytes`. 
+ """ + try: + return self.log_file.stat().st_size >= self.max_file_size_bytes + except FileNotFoundError: + return False + + def _rotate(self) -> None: + """Rotate the log file by starting a new one with a sequence suffix.""" + self._session_id = datetime.now(timezone.utc).strftime("%Y%m%dT%H%M%S") + self.log_file = self.log_dir / f"audit_{self._session_id}.jsonl" + logger.info(f"Audit log rotated: {self.log_file}") + + def _write_record(self, record: dict[str, Any]) -> None: + """Append a JSON record to the audit log file. + + Args: + record: Serialisable dict to write. + """ + if self._should_rotate(): + self._rotate() + with self.log_file.open("a", encoding="utf-8") as fh: + fh.write(json.dumps(record, default=str) + "\n") + self._record_count += 1 + + # ------------------------------------------------------------------ + # Public interface + # ------------------------------------------------------------------ + + def log_event( + self, + event_type: str, + data: dict[str, Any], + severity: str = "INFO", + ) -> dict[str, Any]: + """Log a trading event. + + Args: + event_type: One of the supported event type strings. + data: Arbitrary event payload. + severity: ``"DEBUG"``, ``"INFO"``, ``"WARNING"``, or ``"ERROR"``. + + Returns: + The complete audit record dict (including auto-generated fields). + + Raises: + ValueError: If *event_type* is not in the supported set. + """ + if event_type not in self._VALID_EVENT_TYPES: + raise ValueError( + f"Unknown event_type '{event_type}'. 
" + f"Supported: {sorted(self._VALID_EVENT_TYPES)}" + ) + + record: dict[str, Any] = { + "timestamp": datetime.now(timezone.utc).isoformat(), + "event_type": event_type, + "severity": severity, + "sequence": self._record_count + 1, + **data, + } + + self._write_record(record) + log_fn = getattr(logger, severity.lower(), logger.info) + log_fn(f"[AUDIT] {event_type}: {json.dumps(data, default=str)[:200]}") + return record + + def log_order( + self, + order_id: str, + symbol: str, + side: str, + size: float, + price: float | None, + status: str, + extra: dict[str, Any] | None = None, + ) -> dict[str, Any]: + """Log an order lifecycle event. + + Args: + order_id: Unique order identifier. + symbol: Instrument symbol. + side: ``"buy"`` or ``"sell"``. + size: Order size. + price: Limit price (None for market orders). + status: Order status string (e.g., ``"submitted"``). + extra: Additional fields to include in the record. + + Returns: + Audit record dict. + """ + event_type = f"order_{status}" if f"order_{status}" in self._VALID_EVENT_TYPES else "order_submitted" + return self.log_event( + event_type, + { + "order_id": order_id, + "symbol": symbol, + "side": side, + "size": size, + "price": price, + "status": status, + **(extra or {}), + }, + ) + + def log_risk_alert( + self, + alert_type: str, + symbol: str | None, + metric: str, + value: float, + threshold: float, + extra: dict[str, Any] | None = None, + ) -> dict[str, Any]: + """Log a risk management alert. + + Args: + alert_type: Short descriptor (e.g., ``"var_breach"``). + symbol: Affected symbol or None for portfolio-level alerts. + metric: Risk metric name. + value: Current metric value. + threshold: Breach threshold. + extra: Additional context. + + Returns: + Audit record dict. 
+ """ + return self.log_event( + "risk_alert", + { + "alert_type": alert_type, + "symbol": symbol, + "metric": metric, + "value": value, + "threshold": threshold, + **(extra or {}), + }, + severity="WARNING", + ) + + def get_recent_records(self, n: int = 100) -> list[dict[str, Any]]: + """Read the most recent *n* records from the active log file. + + Args: + n: Number of records to return. + + Returns: + List of parsed record dicts (oldest first within the slice). + """ + try: + lines = self.log_file.read_text(encoding="utf-8").splitlines() + records = [] + for line in lines[-n:]: + try: + records.append(json.loads(line)) + except json.JSONDecodeError: + continue + return records + except FileNotFoundError: + return [] diff --git a/vertical-ai/compliance/regulatory_checker.py b/vertical-ai/compliance/regulatory_checker.py new file mode 100644 index 0000000..a8bb80f --- /dev/null +++ b/vertical-ai/compliance/regulatory_checker.py @@ -0,0 +1,272 @@ +"""Regulatory compliance: position limits, wash trading, and PDT checks. + +Provides :class:`RegulatoryChecker` for pre-trade and post-trade compliance +validation. +""" + +from __future__ import annotations + +import re +from collections import defaultdict +from datetime import datetime, timedelta, timezone +from typing import Any + +from loguru import logger + + +class RegulatoryChecker: + """Check proposed and executed trades against regulatory rules. + + Implements three key compliance checks: + + 1. **Position limits** – rejects orders that would breach per-asset or + portfolio gross exposure limits. + 2. **Wash trading detection** – flags buy-then-sell (or vice versa) of the + same instrument within a configurable window. + 3. **Pattern Day Trading (PDT)** – counts day-trade round-trips in a + rolling 5-trading-day window and enforces the FINRA 3-trip limit for + accounts below the minimum equity threshold. + + Attributes: + position_limits: Per-symbol maximum absolute position size. 
+ portfolio_limit: Maximum sum of absolute positions across all symbols. + wash_trade_window_secs: Time window to detect wash trades. + pdt_account_minimum: Equity threshold below which PDT applies. + pdt_max_day_trades: Maximum day trades per rolling 5-day window. + """ + + def __init__( + self, + position_limits: dict[str, float] | None = None, + portfolio_limit: float = 1_000_000.0, + wash_trade_window_secs: int = 30, + pdt_account_minimum: float = 25_000.0, + pdt_max_day_trades: int = 3, + ) -> None: + """Initialise RegulatoryChecker. + + Args: + position_limits: Symbol → max absolute position size. + portfolio_limit: Maximum total gross exposure. + wash_trade_window_secs: Seconds within which a buy followed by a + sell (or vice versa) of the same symbol is flagged as wash. + pdt_account_minimum: Account equity below which PDT rules apply. + pdt_max_day_trades: Allowed day trades per rolling 5-day window. + """ + self.position_limits: dict[str, float] = position_limits or {} + self.portfolio_limit = portfolio_limit + self.wash_trade_window_secs = wash_trade_window_secs + self.pdt_account_minimum = pdt_account_minimum + self.pdt_max_day_trades = pdt_max_day_trades + + # Internal state for wash-trade and PDT tracking + self._recent_trades: dict[str, list[dict[str, Any]]] = defaultdict(list) + self._day_trades: list[datetime] = [] + + # ------------------------------------------------------------------ + # Private helpers + # ------------------------------------------------------------------ + + def _prune_old_trades(self, symbol: str, now: datetime) -> None: + """Remove wash-trade records outside the detection window. + + Args: + symbol: Instrument symbol. + now: Current UTC datetime. 
+ """ + cutoff = now - timedelta(seconds=self.wash_trade_window_secs) + self._recent_trades[symbol] = [ + t for t in self._recent_trades[symbol] + if t["timestamp"] >= cutoff + ] + + def _prune_old_day_trades(self, now: datetime) -> None: + """Remove PDT records older than 5 calendar days. + + Args: + now: Current UTC datetime. + """ + cutoff = now - timedelta(days=5) + self._day_trades = [dt for dt in self._day_trades if dt >= cutoff] + + # ------------------------------------------------------------------ + # Public interface + # ------------------------------------------------------------------ + + def check_position_limit( + self, + symbol: str, + current_position: float, + order_size: float, + side: str, + ) -> dict[str, Any]: + """Check whether an order would breach position limits. + + Args: + symbol: Instrument symbol. + current_position: Current signed position (positive = long). + order_size: Unsigned order size. + side: ``"buy"`` or ``"sell"``. + + Returns: + Dict with keys ``passed`` (bool), ``reason`` (str or None), + ``resulting_position`` (float), ``limit`` (float). + """ + delta = order_size if side == "buy" else -order_size + resulting = current_position + delta + limit = self.position_limits.get(symbol, float("inf")) + + if abs(resulting) > limit: + logger.warning(f"Position limit breach: {symbol} → {resulting} > {limit}") + return { + "passed": False, + "reason": ( + f"Position {resulting:.0f} exceeds limit {limit:.0f} for {symbol}" + ), + "resulting_position": resulting, + "limit": limit, + } + return {"passed": True, "reason": None, "resulting_position": resulting, "limit": limit} + + def check_portfolio_limit( + self, positions: dict[str, float], prices: dict[str, float] + ) -> dict[str, Any]: + """Check gross portfolio exposure against the portfolio limit. + + Args: + positions: Symbol → signed share position. + prices: Symbol → current price. + + Returns: + Dict with keys ``passed``, ``gross_exposure``, ``limit``. 
+ """ + gross = sum(abs(pos) * prices.get(sym, 0.0) for sym, pos in positions.items()) + passed = gross <= self.portfolio_limit + if not passed: + logger.warning(f"Portfolio limit breach: {gross:.2f} > {self.portfolio_limit:.2f}") + return { + "passed": passed, + "gross_exposure": round(gross, 2), + "limit": self.portfolio_limit, + } + + def check_wash_trade( + self, + symbol: str, + side: str, + timestamp: datetime | None = None, + ) -> dict[str, Any]: + """Detect potential wash trading. + + A wash trade is flagged when an opposite-side order for the same + symbol arrives within :attr:`wash_trade_window_secs`. + + Args: + symbol: Instrument symbol. + side: ``"buy"`` or ``"sell"``. + timestamp: Order timestamp; defaults to ``datetime.now(UTC)``. + + Returns: + Dict with keys ``passed`` (False = wash trade detected), + ``reason``, ``flagged_trades``. + """ + now = timestamp or datetime.now(timezone.utc) + self._prune_old_trades(symbol, now) + + opposite = "sell" if side == "buy" else "buy" + flagged = [ + t for t in self._recent_trades[symbol] if t["side"] == opposite + ] + + self._recent_trades[symbol].append({"side": side, "timestamp": now}) + + if flagged: + logger.warning(f"Wash trade detected: {symbol} {side} within window") + return { + "passed": False, + "reason": f"Wash trade: {symbol} {side} follows {opposite} within " + f"{self.wash_trade_window_secs}s", + "flagged_trades": flagged, + } + return {"passed": True, "reason": None, "flagged_trades": []} + + def check_pattern_day_trading( + self, + account_equity: float, + is_day_trade: bool, + timestamp: datetime | None = None, + ) -> dict[str, Any]: + """Enforce FINRA Pattern Day Trading rules. + + Accounts below :attr:`pdt_account_minimum` are limited to + :attr:`pdt_max_day_trades` round-trips in a rolling 5-day window. + + Args: + account_equity: Current account equity in USD. + is_day_trade: Whether the proposed trade is a day trade (same-day + open and close of the same instrument). 
+ timestamp: Trade timestamp; defaults to ``datetime.now(UTC)``. + + Returns: + Dict with keys ``passed``, ``reason``, ``day_trade_count``. + """ + now = timestamp or datetime.now(timezone.utc) + self._prune_old_day_trades(now) + + if is_day_trade: + self._day_trades.append(now) + + count = len(self._day_trades) + + if account_equity >= self.pdt_account_minimum: + return {"passed": True, "reason": None, "day_trade_count": count} + + if count > self.pdt_max_day_trades: + logger.warning(f"PDT violation: {count} day trades, equity={account_equity:.2f}") + return { + "passed": False, + "reason": ( + f"PDT rule: {count} day trades exceed limit of " + f"{self.pdt_max_day_trades} for accounts below " + f"${self.pdt_account_minimum:,.0f}" + ), + "day_trade_count": count, + } + return {"passed": True, "reason": None, "day_trade_count": count} + + def full_compliance_check( + self, + order: dict[str, Any], + positions: dict[str, float], + prices: dict[str, float], + account_equity: float, + is_day_trade: bool = False, + ) -> dict[str, Any]: + """Run all compliance checks for a proposed order. + + Args: + order: Dict with keys ``symbol``, ``side``, ``size``, + optionally ``timestamp``. + positions: Current signed positions by symbol. + prices: Current prices by symbol. + account_equity: Account equity in USD. + is_day_trade: Whether the order is a day trade. + + Returns: + Dict with ``passed`` (bool) and ``checks`` (per-rule results). 
+ """ + symbol = order["symbol"] + side = order["side"] + size = float(order["size"]) + ts = order.get("timestamp") + + results: dict[str, Any] = {} + results["position_limit"] = self.check_position_limit( + symbol, positions.get(symbol, 0.0), size, side + ) + results["portfolio_limit"] = self.check_portfolio_limit(positions, prices) + results["wash_trade"] = self.check_wash_trade(symbol, side, ts) + results["pdt"] = self.check_pattern_day_trading(account_equity, is_day_trade, ts) + + all_passed = all(v["passed"] for v in results.values()) + return {"passed": all_passed, "checks": results} diff --git a/vertical-ai/execution/__init__.py b/vertical-ai/execution/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/vertical-ai/execution/__pycache__/__init__.cpython-312.pyc b/vertical-ai/execution/__pycache__/__init__.cpython-312.pyc new file mode 100644 index 0000000..65168c3 Binary files /dev/null and b/vertical-ai/execution/__pycache__/__init__.cpython-312.pyc differ diff --git a/vertical-ai/execution/__pycache__/market_impact_model.cpython-312.pyc b/vertical-ai/execution/__pycache__/market_impact_model.cpython-312.pyc new file mode 100644 index 0000000..35f6d28 Binary files /dev/null and b/vertical-ai/execution/__pycache__/market_impact_model.cpython-312.pyc differ diff --git a/vertical-ai/execution/__pycache__/slippage_predictor.cpython-312.pyc b/vertical-ai/execution/__pycache__/slippage_predictor.cpython-312.pyc new file mode 100644 index 0000000..7bc1f4e Binary files /dev/null and b/vertical-ai/execution/__pycache__/slippage_predictor.cpython-312.pyc differ diff --git a/vertical-ai/execution/__pycache__/smart_order_router.cpython-312.pyc b/vertical-ai/execution/__pycache__/smart_order_router.cpython-312.pyc new file mode 100644 index 0000000..697bbad Binary files /dev/null and b/vertical-ai/execution/__pycache__/smart_order_router.cpython-312.pyc differ diff --git a/vertical-ai/execution/market_impact_model.py 
b/vertical-ai/execution/market_impact_model.py new file mode 100644 index 0000000..9a11b05 --- /dev/null +++ b/vertical-ai/execution/market_impact_model.py @@ -0,0 +1,152 @@ +"""Market impact model: square-root and linear price-impact estimation. + +Provides :class:`MarketImpactModel` implementing the Almgren-Chriss square-root +market-impact framework for estimating permanent and temporary price impact. +""" + +from __future__ import annotations + +from typing import Any + +import numpy as np +from loguru import logger + + +class MarketImpactModel: + """Estimate market impact of trades using the square-root model. + + Decomposes total market impact into: + + * **Temporary impact** – immediate, mean-reverting liquidity cost. + * **Permanent impact** – lasting price change from information content. + + The model follows Almgren & Chriss (2001): + ``I_temp = eta * sigma * sqrt(v / ADV)`` + ``I_perm = gamma * sigma * (v / ADV)`` + + where *v* is trade size, *ADV* is average daily volume, and *sigma* is + daily volatility. + + Attributes: + eta: Temporary impact coefficient. + gamma: Permanent impact coefficient. + sigma_daily: Default daily return volatility (fraction). + """ + + def __init__( + self, + eta: float = 0.142, + gamma: float = 0.314, + sigma_daily: float = 0.02, + ) -> None: + """Initialise MarketImpactModel. + + Args: + eta: Temporary impact coefficient (Almgren-Chriss eta). + gamma: Permanent impact coefficient (Almgren-Chriss gamma). + sigma_daily: Default daily volatility estimate (fraction). + """ + self.eta = eta + self.gamma = gamma + self.sigma_daily = sigma_daily + + # ------------------------------------------------------------------ + # Public interface + # ------------------------------------------------------------------ + + def estimate( + self, + order_size: float, + avg_daily_volume: float, + volatility: float | None = None, + side: str = "buy", + ) -> dict[str, float]: + """Estimate market impact for a single trade. 
+ + Args: + order_size: Order size in shares. + avg_daily_volume: Average daily trading volume in shares. + volatility: Daily return volatility; falls back to + :attr:`sigma_daily` if not provided. + side: ``"buy"`` or ``"sell"``. Impact direction is signed + accordingly. + + Returns: + Dict with keys ``temporary_impact_bps``, ``permanent_impact_bps``, + ``total_impact_bps``, ``participation_rate``. + + Raises: + ValueError: If order_size or avg_daily_volume are non-positive, + or side is invalid. + """ + if order_size <= 0: + raise ValueError("order_size must be positive.") + if avg_daily_volume <= 0: + raise ValueError("avg_daily_volume must be positive.") + if side not in ("buy", "sell"): + raise ValueError("side must be 'buy' or 'sell'.") + + sigma = volatility if volatility is not None else self.sigma_daily + v_over_adv = order_size / avg_daily_volume + sign = 1.0 if side == "buy" else -1.0 + + temp_impact = self.eta * sigma * np.sqrt(v_over_adv) * 10_000 + perm_impact = self.gamma * sigma * v_over_adv * 10_000 + + total_impact = sign * (temp_impact + perm_impact) + + result = { + "temporary_impact_bps": round(float(sign * temp_impact), 4), + "permanent_impact_bps": round(float(sign * perm_impact), 4), + "total_impact_bps": round(float(total_impact), 4), + "participation_rate": round(float(v_over_adv), 6), + } + logger.debug(f"Market impact: {result}") + return result + + def optimal_execution_schedule( + self, + total_shares: float, + avg_daily_volume: float, + n_slices: int = 10, + volatility: float | None = None, + risk_aversion: float = 1.0, + ) -> dict[str, Any]: + """Compute a TWAP-like schedule minimising expected impact plus variance. + + Minimises a linear combination of expected market impact and execution + risk (price variance) by distributing the order evenly in time. + + Args: + total_shares: Total shares to execute. + avg_daily_volume: Average daily volume. + n_slices: Number of equal time slices. 
+ volatility: Daily volatility; defaults to :attr:`sigma_daily`. + risk_aversion: Lambda parameter trading off impact vs risk. + + Returns: + Dict with keys ``schedule`` (list of slice sizes), ``total_cost_bps``, + ``execution_shortfall_bps``. + """ + sigma = volatility if volatility is not None else self.sigma_daily + slice_size = total_shares / n_slices + + impacts = [] + for i in range(n_slices): + imp = self.estimate(slice_size, avg_daily_volume, sigma) + impacts.append(imp["total_impact_bps"]) + + total_cost = sum(abs(c) for c in impacts) + variance_penalty = risk_aversion * sigma * np.sqrt(n_slices) * 10_000 + shortfall = total_cost + float(variance_penalty) + + logger.debug( + f"Execution schedule: {n_slices} slices, " + f"total_cost={total_cost:.2f}bps, shortfall={shortfall:.2f}bps" + ) + return { + "schedule": [slice_size] * n_slices, + "impact_per_slice_bps": impacts, + "total_cost_bps": round(total_cost, 4), + "execution_shortfall_bps": round(shortfall, 4), + } diff --git a/vertical-ai/execution/slippage_predictor.py b/vertical-ai/execution/slippage_predictor.py new file mode 100644 index 0000000..6e7c9ce --- /dev/null +++ b/vertical-ai/execution/slippage_predictor.py @@ -0,0 +1,129 @@ +"""Slippage prediction: transaction cost estimation from market microstructure. + +Provides :class:`SlippagePredictor` which estimates expected slippage in basis +points based on order size, spread, and volume characteristics. +""" + +from __future__ import annotations + +from typing import Any + +import numpy as np +from loguru import logger + + +class SlippagePredictor: + """Predict transaction slippage for a proposed trade. + + Combines three cost components: + + 1. **Half-spread cost** – unavoidable cost of crossing the spread. + 2. **Market impact** – price movement caused by the order itself. + 3. **Timing cost** – adverse price drift during execution. + + Attributes: + impact_factor: Scaling coefficient for the square-root impact term. 
+ timing_factor: Scaling coefficient for the timing / drift cost. + adv_lookback: Number of periods used to estimate average daily volume. + """ + + def __init__( + self, + impact_factor: float = 0.1, + timing_factor: float = 0.05, + adv_lookback: int = 20, + ) -> None: + """Initialise SlippagePredictor. + + Args: + impact_factor: Market-impact scaling factor. + timing_factor: Timing-cost scaling factor. + adv_lookback: Look-back periods for ADV estimation. + """ + self.impact_factor = impact_factor + self.timing_factor = timing_factor + self.adv_lookback = adv_lookback + + # ------------------------------------------------------------------ + # Public interface + # ------------------------------------------------------------------ + + def predict( + self, + order_size: float, + avg_daily_volume: float, + spread_bps: float, + volatility: float, + urgency: float = 0.5, + ) -> dict[str, float]: + """Predict total slippage for a trade. + + Args: + order_size: Order size (same units as *avg_daily_volume*). + avg_daily_volume: Average daily traded volume. + spread_bps: Current bid-ask spread in basis points. + volatility: Intraday volatility as a fraction (e.g., 0.01 = 1%). + urgency: Execution urgency in [0, 1]. Higher values cause faster + (more impactful) execution. + + Returns: + Dict with keys ``spread_cost_bps``, ``impact_cost_bps``, + ``timing_cost_bps``, ``total_slippage_bps``. + + Raises: + ValueError: If avg_daily_volume is zero or negative. 
+ """ + if avg_daily_volume <= 0: + raise ValueError("avg_daily_volume must be positive.") + + participation_rate = min(order_size / avg_daily_volume, 1.0) + + spread_cost = spread_bps / 2.0 + impact_cost = ( + self.impact_factor + * volatility + * np.sqrt(participation_rate) + * 10_000 + ) + timing_cost = self.timing_factor * volatility * urgency * 10_000 + + total = spread_cost + impact_cost + timing_cost + + result = { + "spread_cost_bps": round(spread_cost, 4), + "impact_cost_bps": round(float(impact_cost), 4), + "timing_cost_bps": round(float(timing_cost), 4), + "total_slippage_bps": round(float(total), 4), + } + logger.debug(f"Slippage estimate: {result}") + return result + + def predict_from_history( + self, + order_size: float, + volume_history: Any, + price_history: Any, + spread_bps: float = 5.0, + urgency: float = 0.5, + ) -> dict[str, float]: + """Predict slippage using historical volume and price series. + + Args: + order_size: Order size. + volume_history: Array-like of historical volume observations. + price_history: Array-like of historical close prices. + spread_bps: Current spread in basis points. + urgency: Execution urgency in [0, 1]. + + Returns: + Slippage estimate dict (same keys as :meth:`predict`). + """ + vols = np.asarray(volume_history, dtype=np.float64) + prices = np.asarray(price_history, dtype=np.float64) + + adv = float(np.mean(vols[-self.adv_lookback:])) + + returns = np.diff(prices) / prices[:-1] + volatility = float(np.std(returns, ddof=1)) if len(returns) >= 2 else 0.01 + + return self.predict(order_size, adv, spread_bps, volatility, urgency) diff --git a/vertical-ai/execution/smart_order_router.py b/vertical-ai/execution/smart_order_router.py new file mode 100644 index 0000000..9dfb08a --- /dev/null +++ b/vertical-ai/execution/smart_order_router.py @@ -0,0 +1,241 @@ +"""Smart order routing: optimal execution path selection. 
@dataclass
class Venue:
    """A single execution destination (exchange, ECN, or dark pool).

    Attributes:
        name: Venue identifier.
        available_liquidity: Shares / contracts currently available here.
        fee_bps: Per-trade fee in basis points.
        latency_ms: Estimated round-trip latency in milliseconds.
        fill_probability: Empirical likelihood that an order fills here.
    """

    name: str
    available_liquidity: float
    fee_bps: float
    latency_ms: float
    fill_probability: float = 0.95


@dataclass
class RoutingPlan:
    """The outcome of routing: how an order is split across venues.

    Attributes:
        venues: Venue names in execution order.
        allocations: Shares routed to each venue (parallel to ``venues``).
        estimated_cost_bps: Expected total transaction cost in basis points.
        estimated_fill_rate: Expected fraction of the order that fills.
        metadata: Free-form extra context attached to the plan.
    """

    venues: list[str]
    allocations: list[float]
    estimated_cost_bps: float
    estimated_fill_rate: float
    metadata: dict[str, Any] = field(default_factory=dict)
Each dict should + contain keys matching :class:`Venue` field names. + impact_coefficient: Linear market-impact cost coefficient. + max_venues: Maximum venues to split an order across. + """ + default_venues = [ + Venue("PRIMARY", 100_000, 0.5, 1.0, 0.98), + Venue("DARK_POOL", 50_000, 0.2, 5.0, 0.80), + Venue("ECN_1", 75_000, 0.3, 2.0, 0.92), + Venue("ECN_2", 60_000, 0.35, 2.5, 0.90), + ] + if venues: + self.venues: list[Venue] = [Venue(**v) for v in venues] + else: + self.venues = default_venues + + self.impact_coefficient = impact_coefficient + self.max_venues = max_venues + + # ------------------------------------------------------------------ + # Private helpers + # ------------------------------------------------------------------ + + def _venue_cost_score( + self, venue: Venue, order_fraction: float + ) -> float: + """Compute a cost score for sending *order_fraction* to *venue*. + + Lower scores are better. + + Args: + venue: Venue object. + order_fraction: Fraction of total order (0–1). + + Returns: + Cost score (bps equivalent). + """ + fee = venue.fee_bps + impact = self.impact_coefficient * order_fraction * 100 + fill_penalty = (1 - venue.fill_probability) * 50 + latency_penalty = venue.latency_ms * 0.01 + return fee + impact + fill_penalty + latency_penalty + + def _allocate( + self, order_size: float, eligible_venues: list[Venue] + ) -> list[float]: + """Greedy allocation: fill venues in order of available liquidity. + + Args: + order_size: Total order size. + eligible_venues: Venues sorted by preference. + + Returns: + List of allocation amounts matching venue order. 
+ """ + allocations: list[float] = [] + remaining = order_size + for v in eligible_venues: + alloc = min(remaining, v.available_liquidity) + allocations.append(alloc) + remaining -= alloc + if remaining <= 0: + break + while len(allocations) < len(eligible_venues): + allocations.append(0.0) + return allocations + + # ------------------------------------------------------------------ + # Public async interface + # ------------------------------------------------------------------ + + async def route( + self, + order_size: float, + side: str, + urgency: str = "normal", + market_conditions: dict[str, Any] | None = None, + ) -> RoutingPlan: + """Compute an optimal routing plan for an order. + + Args: + order_size: Order size in shares / contracts. + side: ``"buy"`` or ``"sell"``. + urgency: ``"low"``, ``"normal"``, or ``"high"``. Higher urgency + favours low-latency venues even if they cost more. + market_conditions: Optional dict with keys like ``volatility`` and + ``spread_bps`` to adjust impact estimates. + + Returns: + :class:`RoutingPlan` with venue allocations and cost estimates. + + Raises: + ValueError: If side is not ``"buy"`` or ``"sell"``. + """ + if side not in ("buy", "sell"): + raise ValueError("side must be 'buy' or 'sell'.") + + loop = asyncio.get_event_loop() + return await loop.run_in_executor( + None, self._compute_plan, order_size, side, urgency, market_conditions or {} + ) + + def _compute_plan( + self, + order_size: float, + side: str, + urgency: str, + market_conditions: dict[str, Any], + ) -> RoutingPlan: + """Synchronous routing plan computation. + + Args: + order_size: Order size. + side: Order side. + urgency: Urgency level. + market_conditions: Market context dict. + + Returns: + Routing plan. 
    def _compute_plan(
        self,
        order_size: float,
        side: str,
        urgency: str,
        market_conditions: dict[str, Any],
    ) -> RoutingPlan:
        """Synchronous routing plan computation.

        Scores every venue with available liquidity, keeps the cheapest
        :attr:`max_venues`, then greedily allocates shares to them.

        Args:
            order_size: Order size.
            side: Order side.
            urgency: Urgency level.
            market_conditions: Market context dict.

        Returns:
            Routing plan.
        """
        logger.debug(f"Routing {side} order size={order_size}, urgency={urgency}")

        # Pulled from market context for the plan metadata; defaults are used
        # when the caller supplies no conditions.
        vol = market_conditions.get("volatility", 0.01)
        spread_bps = market_conditions.get("spread_bps", 5.0)

        # Sort venues by cost score; use latency tie-break for high urgency
        scored: list[tuple[float, Venue]] = []
        for v in self.venues:
            if v.available_liquidity <= 0:
                continue
            # Fraction of the order this venue could absorb; +1e-9 guards
            # against division by zero for a zero-size order.
            frac = min(order_size, v.available_liquidity) / (order_size + 1e-9)
            score = self._venue_cost_score(v, frac)
            if urgency == "high":
                # NOTE(review): _venue_cost_score already includes a small
                # latency term (x0.01); this adds a much heavier one (x0.1).
                score += v.latency_ms * 0.1
            scored.append((score, v))

        scored.sort(key=lambda x: x[0])
        eligible = [v for _, v in scored[: self.max_venues]]

        # Greedy fill in score order; may leave part of the order unfilled.
        allocations = self._allocate(order_size, eligible)
        total_allocated = sum(allocations)

        # Estimated costs
        total_cost_bps = sum(
            self._venue_cost_score(v, alloc / (order_size + 1e-9))
            for v, alloc in zip(eligible, allocations)
            if alloc > 0
        )
        # Unweighted mean fill probability over venues that received shares.
        fill_probs = [
            v.fill_probability for v, alloc in zip(eligible, allocations) if alloc > 0
        ]
        est_fill_rate = float(np.mean(fill_probs)) if fill_probs else 0.0

        plan = RoutingPlan(
            venues=[v.name for v in eligible],
            allocations=allocations,
            estimated_cost_bps=round(total_cost_bps, 4),
            estimated_fill_rate=round(est_fill_rate, 4),
            metadata={
                "total_allocated": total_allocated,
                "unfilled": max(0.0, order_size - total_allocated),
                "volatility": vol,
                "spread_bps": spread_bps,
            },
        )
        logger.debug(f"Routing plan: {plan.venues}, cost={plan.estimated_cost_bps:.2f}bps")
        return plan
a/vertical-ai/market_analysis/__pycache__/fundamental_analyzer.cpython-312.pyc b/vertical-ai/market_analysis/__pycache__/fundamental_analyzer.cpython-312.pyc new file mode 100644 index 0000000..b8bda8d Binary files /dev/null and b/vertical-ai/market_analysis/__pycache__/fundamental_analyzer.cpython-312.pyc differ diff --git a/vertical-ai/market_analysis/__pycache__/orderbook_analyzer.cpython-312.pyc b/vertical-ai/market_analysis/__pycache__/orderbook_analyzer.cpython-312.pyc new file mode 100644 index 0000000..770aa9e Binary files /dev/null and b/vertical-ai/market_analysis/__pycache__/orderbook_analyzer.cpython-312.pyc differ diff --git a/vertical-ai/market_analysis/__pycache__/sentiment_analyzer.cpython-312.pyc b/vertical-ai/market_analysis/__pycache__/sentiment_analyzer.cpython-312.pyc new file mode 100644 index 0000000..02c19bc Binary files /dev/null and b/vertical-ai/market_analysis/__pycache__/sentiment_analyzer.cpython-312.pyc differ diff --git a/vertical-ai/market_analysis/__pycache__/technical_analyzer.cpython-312.pyc b/vertical-ai/market_analysis/__pycache__/technical_analyzer.cpython-312.pyc new file mode 100644 index 0000000..7f485df Binary files /dev/null and b/vertical-ai/market_analysis/__pycache__/technical_analyzer.cpython-312.pyc differ diff --git a/vertical-ai/market_analysis/fundamental_analyzer.py b/vertical-ai/market_analysis/fundamental_analyzer.py new file mode 100644 index 0000000..78b0538 --- /dev/null +++ b/vertical-ai/market_analysis/fundamental_analyzer.py @@ -0,0 +1,169 @@ +"""Fundamental analysis: financial ratio computation and scoring. + +Provides the :class:`FundamentalAnalyzer` for evaluating company financials +through common valuation and health ratios. +""" + +from __future__ import annotations + +from typing import Any + +from loguru import logger + + +class FundamentalAnalyzer: + """Analyse company financial data through standard valuation ratios. 
+ + Computes valuation (P/E, P/B, EV/EBITDA), profitability (ROE, ROA, profit + margin), and leverage (debt-to-equity, current ratio, interest coverage) + metrics from raw financial statement data. + + Attributes: + thresholds: Dict of ratio name → (low_threshold, high_threshold) + used to tag ratios as ``"undervalued"``, ``"fair"``, or + ``"overvalued"``/``"risky"``. + """ + + _DEFAULT_THRESHOLDS: dict[str, tuple[float, float]] = { + "pe_ratio": (0.0, 25.0), + "pb_ratio": (0.0, 3.0), + "ev_ebitda": (0.0, 15.0), + "roe": (0.10, 0.30), + "roa": (0.05, 0.20), + "profit_margin": (0.05, 0.30), + "debt_to_equity": (0.0, 1.0), + "current_ratio": (1.5, 3.0), + "interest_coverage": (3.0, 10.0), + } + + def __init__( + self, + thresholds: dict[str, tuple[float, float]] | None = None, + ) -> None: + """Initialise FundamentalAnalyzer. + + Args: + thresholds: Override default ratio threshold bands. Each entry + maps a ratio name to ``(min_good, max_good)`` bounds. + """ + self.thresholds: dict[str, tuple[float, float]] = { + **self._DEFAULT_THRESHOLDS, + **(thresholds or {}), + } + + # ------------------------------------------------------------------ + # Private helpers + # ------------------------------------------------------------------ + + @staticmethod + def _safe_div(numerator: float, denominator: float, default: float = float("nan")) -> float: + """Return numerator / denominator, or *default* on zero-division. + + Args: + numerator: Dividend value. + denominator: Divisor value. + default: Fallback when denominator is zero. + + Returns: + Computed ratio or *default*. + """ + if denominator == 0: + return default + return numerator / denominator + + def _score_ratio(self, name: str, value: float) -> str: + """Classify a ratio as ``healthy``, ``low``, or ``high``. + + Args: + name: Ratio name (must exist in :attr:`thresholds`). + value: Computed ratio value. + + Returns: + Classification string. 
+ """ + if name not in self.thresholds: + return "unknown" + low, high = self.thresholds[name] + if value < low: + return "low" + if value > high: + return "high" + return "healthy" + + # ------------------------------------------------------------------ + # Public interface + # ------------------------------------------------------------------ + + def analyze_fundamentals(self, financial_data: dict[str, Any]) -> dict[str, Any]: + """Compute financial ratios from raw statement data. + + Args: + financial_data: Dict containing any subset of the following keys: + + * ``price`` – current stock price + * ``eps`` – earnings per share + * ``book_value_per_share`` – book value per share + * ``net_income`` – net income + * ``revenue`` – total revenue + * ``total_equity`` – shareholders' equity + * ``total_assets`` – total assets + * ``total_debt`` – total debt + * ``current_assets`` – current assets + * ``current_liabilities`` – current liabilities + * ``ebit`` – EBIT + * ``interest_expense`` – interest expense + * ``enterprise_value`` – enterprise value + * ``ebitda`` – EBITDA + + Returns: + Dict with keys ``ratios`` (computed float values) and ``scores`` + (classification strings for each ratio). + + Raises: + TypeError: If *financial_data* is not a dict. 
+ """ + if not isinstance(financial_data, dict): + raise TypeError(f"financial_data must be a dict, got {type(financial_data)}") + + logger.debug("Computing fundamental ratios") + fd = financial_data + + ratios: dict[str, float] = {} + + # Valuation + ratios["pe_ratio"] = self._safe_div( + fd.get("price", 0.0), fd.get("eps", 0.0) + ) + ratios["pb_ratio"] = self._safe_div( + fd.get("price", 0.0), fd.get("book_value_per_share", 0.0) + ) + ratios["ev_ebitda"] = self._safe_div( + fd.get("enterprise_value", 0.0), fd.get("ebitda", 0.0) + ) + + # Profitability + ratios["roe"] = self._safe_div( + fd.get("net_income", 0.0), fd.get("total_equity", 0.0) + ) + ratios["roa"] = self._safe_div( + fd.get("net_income", 0.0), fd.get("total_assets", 0.0) + ) + ratios["profit_margin"] = self._safe_div( + fd.get("net_income", 0.0), fd.get("revenue", 0.0) + ) + + # Leverage / liquidity + ratios["debt_to_equity"] = self._safe_div( + fd.get("total_debt", 0.0), fd.get("total_equity", 0.0) + ) + ratios["current_ratio"] = self._safe_div( + fd.get("current_assets", 0.0), fd.get("current_liabilities", 0.0) + ) + ratios["interest_coverage"] = self._safe_div( + fd.get("ebit", 0.0), fd.get("interest_expense", 0.0) + ) + + scores = {name: self._score_ratio(name, val) for name, val in ratios.items()} + + logger.debug(f"Fundamental analysis complete: {len(ratios)} ratios computed") + return {"ratios": ratios, "scores": scores} diff --git a/vertical-ai/market_analysis/orderbook_analyzer.py b/vertical-ai/market_analysis/orderbook_analyzer.py new file mode 100644 index 0000000..7acf5ec --- /dev/null +++ b/vertical-ai/market_analysis/orderbook_analyzer.py @@ -0,0 +1,234 @@ +"""Order-book analysis: market depth, bid-ask imbalance, and liquidity scoring. + +Provides :class:`OrderBookAnalyzer` for real-time microstructure metrics. 
+""" + +from __future__ import annotations + +import asyncio +from typing import Any + +import numpy as np +from loguru import logger + + +class OrderBookAnalyzer: + """Analyse Level-2 order-book snapshots for microstructure metrics. + + Computes bid-ask spread, depth imbalance, weighted mid-price, and a + composite liquidity score from raw order-book data. + + Attributes: + depth_levels: Number of price levels to consider when computing + liquidity and imbalance metrics. + imbalance_alpha: Exponential smoothing factor for rolling imbalance. + """ + + def __init__( + self, + depth_levels: int = 10, + imbalance_alpha: float = 0.1, + ) -> None: + """Initialise OrderBookAnalyzer. + + Args: + depth_levels: How many top price levels to include in analysis. + imbalance_alpha: EMA smoothing factor for running imbalance + estimate (0 < alpha ≤ 1). + """ + if not 0 < imbalance_alpha <= 1: + raise ValueError("imbalance_alpha must be in (0, 1].") + self.depth_levels = depth_levels + self.imbalance_alpha = imbalance_alpha + self._running_imbalance: float | None = None + + # ------------------------------------------------------------------ + # Private helpers + # ------------------------------------------------------------------ + + @staticmethod + def _validate_side( + side: list[list[float]], name: str + ) -> tuple[np.ndarray, np.ndarray]: + """Parse and validate one side of the order book. + + Args: + side: List of ``[price, size]`` pairs. + name: ``"bids"`` or ``"asks"`` (for error messages). + + Returns: + Tuple of (prices, sizes) as float64 arrays. + + Raises: + ValueError: If the side is empty or malformed. 
+ """ + if not side: + raise ValueError(f"Order book '{name}' must not be empty.") + arr = np.asarray(side, dtype=np.float64) + if arr.ndim != 2 or arr.shape[1] < 2: + raise ValueError(f"Each '{name}' entry must be [price, size].") + return arr[:, 0], arr[:, 1] + + def _best_bid_ask( + self, + bid_prices: np.ndarray, + ask_prices: np.ndarray, + ) -> tuple[float, float]: + """Return best bid and best ask prices. + + Args: + bid_prices: All bid price levels. + ask_prices: All ask price levels. + + Returns: + Tuple of (best_bid, best_ask). + """ + return float(np.max(bid_prices)), float(np.min(ask_prices)) + + def _weighted_mid_price( + self, + best_bid: float, + best_ask: float, + bid_size_at_best: float, + ask_size_at_best: float, + ) -> float: + """Compute size-weighted mid-price. + + Args: + best_bid: Best bid price. + best_ask: Best ask price. + bid_size_at_best: Size at best bid. + ask_size_at_best: Size at best ask. + + Returns: + Weighted mid-price. + """ + total = bid_size_at_best + ask_size_at_best + if total == 0: + return (best_bid + best_ask) / 2.0 + return (best_bid * ask_size_at_best + best_ask * bid_size_at_best) / total + + def _liquidity_score( + self, + bid_prices: np.ndarray, + bid_sizes: np.ndarray, + ask_prices: np.ndarray, + ask_sizes: np.ndarray, + spread: float, + mid: float, + ) -> float: + """Compute a composite liquidity score in [0, 1]. + + Combines spread tightness, total depth, and level count into a single + normalised metric. + + Args: + bid_prices: Bid price levels. + bid_sizes: Bid size levels. + ask_prices: Ask price levels. + ask_sizes: Ask size levels. + spread: Absolute bid-ask spread. + mid: Mid-price. + + Returns: + Liquidity score (higher is more liquid). 
+ """ + n = self.depth_levels + bid_depth = np.sum(bid_sizes[:n]) if len(bid_sizes) >= n else np.sum(bid_sizes) + ask_depth = np.sum(ask_sizes[:n]) if len(ask_sizes) >= n else np.sum(ask_sizes) + total_depth = bid_depth + ask_depth + + spread_score = 1.0 / (1.0 + spread / (mid + 1e-9) * 100) + depth_score = np.tanh(total_depth / 1000.0) + + return float(np.clip(0.5 * spread_score + 0.5 * depth_score, 0.0, 1.0)) + + # ------------------------------------------------------------------ + # Public async interface + # ------------------------------------------------------------------ + + async def analyze(self, orderbook: dict[str, Any]) -> dict[str, Any]: + """Analyse an order-book snapshot asynchronously. + + Args: + orderbook: Dict with keys: + + * ``bids`` – list of ``[price, size]`` pairs sorted + descending by price. + * ``asks`` – list of ``[price, size]`` pairs sorted + ascending by price. + + Returns: + Dict with keys ``best_bid``, ``best_ask``, ``spread``, + ``spread_bps``, ``mid_price``, ``weighted_mid_price``, + ``bid_ask_imbalance``, ``total_bid_depth``, ``total_ask_depth``, + ``liquidity_score``. + + Raises: + KeyError: If ``bids`` or ``asks`` keys are absent. + ValueError: If order-book data is malformed. + """ + for key in ("bids", "asks"): + if key not in orderbook: + raise KeyError(f"Order book missing required key: '{key}'") + + loop = asyncio.get_event_loop() + return await loop.run_in_executor(None, self._compute_metrics, orderbook) + + def _compute_metrics(self, orderbook: dict[str, Any]) -> dict[str, Any]: + """Synchronous metric computation. + + Args: + orderbook: Validated order-book dict. + + Returns: + Metrics dict. 
    def _compute_metrics(self, orderbook: dict[str, Any]) -> dict[str, Any]:
        """Synchronous metric computation.

        Derives spread, mid-prices, depth imbalance, the EMA of imbalance,
        and a composite liquidity score from one validated snapshot. Mutates
        :attr:`_running_imbalance` as a side effect.

        Args:
            orderbook: Validated order-book dict.

        Returns:
            Metrics dict.
        """
        logger.debug("Computing order-book metrics")
        bid_prices, bid_sizes = self._validate_side(orderbook["bids"], "bids")
        ask_prices, ask_sizes = self._validate_side(orderbook["asks"], "asks")

        best_bid, best_ask = self._best_bid_ask(bid_prices, ask_prices)
        spread = best_ask - best_bid
        mid = (best_bid + best_ask) / 2.0
        # Guard against a non-positive mid (e.g. empty/zero-priced book).
        spread_bps = (spread / mid) * 10_000 if mid > 0 else 0.0

        # Locate top-of-book by value rather than assuming sorted input —
        # defensive against callers that violate the documented ordering.
        bid_best_idx = int(np.argmax(bid_prices))
        ask_best_idx = int(np.argmin(ask_prices))
        wmid = self._weighted_mid_price(
            best_bid, best_ask,
            float(bid_sizes[bid_best_idx]),
            float(ask_sizes[ask_best_idx]),
        )

        # Depth is truncated to the configured number of levels; +1e-9 guards
        # against division by zero on an empty-depth book.
        n = self.depth_levels
        total_bid = float(np.sum(bid_sizes[:n]))
        total_ask = float(np.sum(ask_sizes[:n]))
        imbalance = (total_bid - total_ask) / (total_bid + total_ask + 1e-9)

        # Update exponential running imbalance (first snapshot seeds the EMA).
        if self._running_imbalance is None:
            self._running_imbalance = imbalance
        else:
            self._running_imbalance = (
                self.imbalance_alpha * imbalance
                + (1 - self.imbalance_alpha) * self._running_imbalance
            )

        liq = self._liquidity_score(
            bid_prices, bid_sizes, ask_prices, ask_sizes, spread, mid
        )

        return {
            "best_bid": best_bid,
            "best_ask": best_ask,
            "spread": spread,
            "spread_bps": round(spread_bps, 4),
            "mid_price": mid,
            "weighted_mid_price": wmid,
            "bid_ask_imbalance": round(imbalance, 6),
            "running_imbalance": round(self._running_imbalance, 6),
            "total_bid_depth": total_bid,
            "total_ask_depth": total_ask,
            "liquidity_score": round(liq, 4),
        }
+""" + +from __future__ import annotations + +import re +from typing import Any + +import numpy as np +from loguru import logger + + +# --------------------------------------------------------------------------- +# Minimal built-in lexicon (finance-domain keywords) +# --------------------------------------------------------------------------- + +_POSITIVE_WORDS: frozenset[str] = frozenset( + [ + "bullish", "rally", "surge", "gain", "profit", "growth", "beat", + "outperform", "upgrade", "strong", "record", "breakthrough", "positive", + "optimistic", "recovery", "boom", "buy", "upside", "expansion", "rise", + "soar", "high", "robust", "confident", "dividend", "upbeat", "exceed", + "accelerate", "improve", "advance", "momentum", + ] +) + +_NEGATIVE_WORDS: frozenset[str] = frozenset( + [ + "bearish", "crash", "plunge", "loss", "decline", "miss", "downgrade", + "weak", "concern", "risk", "fear", "sell", "cut", "drop", "fall", + "slump", "debt", "default", "recession", "inflation", "warning", + "disappointing", "underperform", "volatile", "uncertainty", "downturn", + "restructure", "layoff", "bankruptcy", "lawsuit", "fraud", + ] +) + +_NEGATION_WORDS: frozenset[str] = frozenset( + ["not", "no", "never", "neither", "nor", "hardly", "barely", "scarcely"] +) + +_INTENSIFIER_WORDS: dict[str, float] = { + "very": 1.5, + "extremely": 2.0, + "significantly": 1.5, + "slightly": 0.5, + "somewhat": 0.7, + "highly": 1.5, + "major": 1.5, + "minor": 0.5, +} + + +class SentimentAnalyzer: + """Lexicon-based sentiment scorer for financial text. + + Scores individual tokens using a finance-domain lexicon, applies negation + and intensifier modifiers, then aggregates across multiple documents using + a configurable weighting scheme. + + Attributes: + positive_words: Set of positive sentiment words. + negative_words: Set of negative sentiment words. + negation_window: Number of tokens after a negation word where + sentiment is flipped. 
+ default_weights: Weighting strategy (``"uniform"`` or ``"recency"``). + """ + + def __init__( + self, + positive_words: frozenset[str] | None = None, + negative_words: frozenset[str] | None = None, + negation_window: int = 3, + default_weights: str = "uniform", + ) -> None: + """Initialise SentimentAnalyzer. + + Args: + positive_words: Override default positive lexicon. + negative_words: Override default negative lexicon. + negation_window: Token window after a negation word where polarity + is flipped. + default_weights: ``"uniform"`` (equal weight per document) or + ``"recency"`` (more-recent docs weighted higher). + """ + self.positive_words = positive_words or _POSITIVE_WORDS + self.negative_words = negative_words or _NEGATIVE_WORDS + self.negation_window = negation_window + self.default_weights = default_weights + + # ------------------------------------------------------------------ + # Private helpers + # ------------------------------------------------------------------ + + @staticmethod + def _tokenize(text: str) -> list[str]: + """Lower-case and split text into word tokens. + + Args: + text: Raw input string. + + Returns: + List of lower-cased word tokens. + """ + return re.findall(r"[a-z]+", text.lower()) + + def _score_text(self, text: str) -> float: + """Score a single text document. + + Applies negation window and intensifier multipliers. + + Args: + text: Raw text string. + + Returns: + Raw sentiment score (can exceed [-1, 1] before normalisation). 
+ """ + tokens = self._tokenize(text) + score = 0.0 + negation_count = 0 + intensifier = 1.0 + + for token in tokens: + if token in _NEGATION_WORDS: + negation_count = self.negation_window + continue + + if token in _INTENSIFIER_WORDS: + intensifier = _INTENSIFIER_WORDS[token] + continue + + polarity = 0.0 + if token in self.positive_words: + polarity = 1.0 + elif token in self.negative_words: + polarity = -1.0 + + if polarity != 0.0: + if negation_count > 0: + polarity *= -1.0 + score += polarity * intensifier + + if negation_count > 0: + negation_count -= 1 + intensifier = 1.0 # reset after each scored word + + return score + + @staticmethod + def _normalise(score: float, n_tokens: int) -> float: + """Normalise raw score to [-1, 1]. + + Args: + score: Accumulated raw score. + n_tokens: Number of tokens in the document. + + Returns: + Score clamped to [-1, 1]. + """ + if n_tokens == 0: + return 0.0 + normalised = score / n_tokens + return float(np.clip(normalised, -1.0, 1.0)) + + def _build_weights(self, n: int, strategy: str) -> np.ndarray: + """Build a weight vector for *n* documents. + + Args: + n: Number of documents. + strategy: ``"uniform"`` or ``"recency"``. + + Returns: + Normalised weight array of shape ``(n,)``. + """ + if strategy == "recency": + weights = np.arange(1, n + 1, dtype=float) + else: + weights = np.ones(n, dtype=float) + return weights / weights.sum() + + # ------------------------------------------------------------------ + # Public interface + # ------------------------------------------------------------------ + + def analyze_sentiment( + self, + texts: list[str], + weights: list[float] | None = None, + ) -> dict[str, Any]: + """Compute aggregate sentiment score across a list of text documents. + + Args: + texts: List of text strings (news headlines, tweets, etc.). + weights: Optional per-document weights. Must sum to 1 if provided. + If ``None``, uses :attr:`default_weights` strategy. 
+ + Returns: + Dict with keys: + + * ``score`` – aggregate sentiment in [-1, 1] + * ``individual_scores`` – per-document scores + * ``label`` – ``"positive"``, ``"negative"``, or ``"neutral"`` + + Raises: + ValueError: If *texts* is empty or *weights* length mismatches. + """ + if not texts: + raise ValueError("texts must be a non-empty list of strings.") + + individual: list[float] = [] + for text in texts: + tokens = self._tokenize(text) + raw = self._score_text(text) + individual.append(self._normalise(raw, max(len(tokens), 1))) + + if weights is not None: + if len(weights) != len(texts): + raise ValueError( + f"weights length ({len(weights)}) != texts length ({len(texts)})" + ) + w = np.asarray(weights, dtype=float) + w = w / w.sum() + else: + w = self._build_weights(len(texts), self.default_weights) + + aggregate = float(np.dot(w, individual)) + + if aggregate > 0.05: + label = "positive" + elif aggregate < -0.05: + label = "negative" + else: + label = "neutral" + + logger.debug(f"Sentiment analysis: {len(texts)} docs → score={aggregate:.4f} ({label})") + return { + "score": aggregate, + "individual_scores": individual, + "label": label, + } diff --git a/vertical-ai/market_analysis/technical_analyzer.py b/vertical-ai/market_analysis/technical_analyzer.py new file mode 100644 index 0000000..7c953d2 --- /dev/null +++ b/vertical-ai/market_analysis/technical_analyzer.py @@ -0,0 +1,312 @@ +"""Technical analysis: chart patterns and price indicators. + +Provides the :class:`TechnicalAnalyzer` which computes common technical +indicators from OHLCV data using pure NumPy arithmetic. +""" + +from __future__ import annotations + +import asyncio +from typing import Any + +import numpy as np +from loguru import logger + + +class TechnicalAnalyzer: + """Compute technical indicators and detect chart patterns from OHLCV data. + + All heavy computation is delegated to NumPy vectorised operations so the + class remains dependency-light while staying numerically correct. 
+ + Attributes: + sma_periods: Periods for Simple Moving Average computation. + ema_periods: Periods for Exponential Moving Average computation. + rsi_period: Look-back period for RSI. + bb_period: Look-back period for Bollinger Bands. + bb_std: Number of standard deviations for Bollinger Band width. + atr_period: Look-back period for ATR. + macd_fast: Fast EMA period for MACD. + macd_slow: Slow EMA period for MACD. + macd_signal: Signal EMA period for MACD. + """ + + def __init__( + self, + sma_periods: list[int] | None = None, + ema_periods: list[int] | None = None, + rsi_period: int = 14, + bb_period: int = 20, + bb_std: float = 2.0, + atr_period: int = 14, + macd_fast: int = 12, + macd_slow: int = 26, + macd_signal: int = 9, + ) -> None: + """Initialise TechnicalAnalyzer with indicator parameters. + + Args: + sma_periods: List of SMA look-back periods. Defaults to [20, 50, 200]. + ema_periods: List of EMA look-back periods. Defaults to [12, 26]. + rsi_period: RSI look-back period. + bb_period: Bollinger Band look-back period. + bb_std: Bollinger Band standard-deviation multiplier. + atr_period: ATR look-back period. + macd_fast: MACD fast EMA period. + macd_slow: MACD slow EMA period. + macd_signal: MACD signal-line EMA period. + """ + self.sma_periods = sma_periods or [20, 50, 200] + self.ema_periods = ema_periods or [12, 26] + self.rsi_period = rsi_period + self.bb_period = bb_period + self.bb_std = bb_std + self.atr_period = atr_period + self.macd_fast = macd_fast + self.macd_slow = macd_slow + self.macd_signal = macd_signal + + # ------------------------------------------------------------------ + # Private helpers + # ------------------------------------------------------------------ + + @staticmethod + def _to_array(data: Any) -> np.ndarray: + """Convert input to a float64 NumPy array. + + Args: + data: Any array-like structure. + + Returns: + 1-D float64 NumPy array. + + Raises: + ValueError: If conversion produces an empty array. 
+ """ + arr = np.asarray(data, dtype=np.float64) + if arr.ndim != 1 or arr.size == 0: + raise ValueError("Expected a non-empty 1-D array-like input.") + return arr + + def _ema(self, prices: np.ndarray, period: int) -> np.ndarray: + """Compute Exponential Moving Average. + + Args: + prices: 1-D price array. + period: Look-back period. + + Returns: + EMA values array of the same length as *prices* (initial values + are NaN until enough data is available). + """ + k = 2.0 / (period + 1) + ema = np.full(len(prices), np.nan) + # seed with simple average of the first *period* values + if len(prices) < period: + return ema + ema[period - 1] = np.mean(prices[:period]) + for i in range(period, len(prices)): + ema[i] = prices[i] * k + ema[i - 1] * (1 - k) + return ema + + def _sma(self, prices: np.ndarray, period: int) -> np.ndarray: + """Compute Simple Moving Average using a sliding window. + + Args: + prices: 1-D price array. + period: Look-back period. + + Returns: + SMA array (NaN for indices < period − 1). + """ + sma = np.full(len(prices), np.nan) + if len(prices) < period: + return sma + cumsum = np.cumsum(prices) + sma[period - 1:] = ( + cumsum[period - 1:] + - np.concatenate(([0.0], cumsum[: len(prices) - period])) + ) / period + return sma + + def _rsi(self, prices: np.ndarray) -> np.ndarray: + """Compute Relative Strength Index. + + Args: + prices: 1-D close price array. + + Returns: + RSI array in the range [0, 100]. 
+ """ + period = self.rsi_period + rsi = np.full(len(prices), np.nan) + if len(prices) <= period: + return rsi + + deltas = np.diff(prices) + gains = np.where(deltas > 0, deltas, 0.0) + losses = np.where(deltas < 0, -deltas, 0.0) + + avg_gain = np.mean(gains[:period]) + avg_loss = np.mean(losses[:period]) + + for i in range(period, len(prices) - 1): + avg_gain = (avg_gain * (period - 1) + gains[i]) / period + avg_loss = (avg_loss * (period - 1) + losses[i]) / period + rs = avg_gain / avg_loss if avg_loss != 0 else np.inf + rsi[i + 1] = 100.0 - (100.0 / (1.0 + rs)) + + return rsi + + def _bollinger_bands( + self, prices: np.ndarray + ) -> tuple[np.ndarray, np.ndarray, np.ndarray]: + """Compute Bollinger Bands (upper, middle, lower). + + Args: + prices: 1-D close price array. + + Returns: + Tuple of (upper_band, middle_band, lower_band) arrays. + """ + middle = self._sma(prices, self.bb_period) + std = np.full(len(prices), np.nan) + for i in range(self.bb_period - 1, len(prices)): + std[i] = np.std(prices[i - self.bb_period + 1: i + 1], ddof=0) + upper = middle + self.bb_std * std + lower = middle - self.bb_std * std + return upper, middle, lower + + def _atr( + self, high: np.ndarray, low: np.ndarray, close: np.ndarray + ) -> np.ndarray: + """Compute Average True Range. + + Args: + high: High prices array. + low: Low prices array. + close: Close prices array. + + Returns: + ATR array. + """ + n = len(close) + atr = np.full(n, np.nan) + if n < 2: + return atr + + tr = np.zeros(n) + tr[0] = high[0] - low[0] + for i in range(1, n): + tr[i] = max( + high[i] - low[i], + abs(high[i] - close[i - 1]), + abs(low[i] - close[i - 1]), + ) + + period = self.atr_period + if n < period: + return atr + atr[period - 1] = np.mean(tr[:period]) + for i in range(period, n): + atr[i] = (atr[i - 1] * (period - 1) + tr[i]) / period + return atr + + def _macd( + self, prices: np.ndarray + ) -> tuple[np.ndarray, np.ndarray, np.ndarray]: + """Compute MACD, signal line, and histogram. 
+ + Args: + prices: 1-D close price array. + + Returns: + Tuple of (macd_line, signal_line, histogram) arrays. + """ + fast_ema = self._ema(prices, self.macd_fast) + slow_ema = self._ema(prices, self.macd_slow) + macd_line = fast_ema - slow_ema + # build signal only where macd_line is valid + signal = self._ema( + np.where(np.isnan(macd_line), 0.0, macd_line), self.macd_signal + ) + histogram = macd_line - signal + return macd_line, signal, histogram + + # ------------------------------------------------------------------ + # Public async interface + # ------------------------------------------------------------------ + + async def analyze(self, ohlcv_data: dict[str, Any]) -> dict[str, Any]: + """Compute all technical indicators from OHLCV data. + + The computation is CPU-bound; the method uses + ``asyncio.get_event_loop().run_in_executor`` to avoid blocking the + event loop. + + Args: + ohlcv_data: Dict with keys ``open``, ``high``, ``low``, ``close``, + ``volume`` each mapped to an array-like of numeric values. + + Returns: + Dict of indicator results. Each value is a list (NaN → None) or + a nested dict of lists. + + Raises: + KeyError: If a required OHLCV key is missing. + ValueError: If arrays are empty or mis-shaped. + """ + required = {"open", "high", "low", "close", "volume"} + missing = required - ohlcv_data.keys() + if missing: + raise KeyError(f"Missing OHLCV keys: {missing}") + + loop = asyncio.get_event_loop() + return await loop.run_in_executor(None, self._compute_indicators, ohlcv_data) + + def _compute_indicators(self, ohlcv_data: dict[str, Any]) -> dict[str, Any]: + """Synchronous indicator computation (runs in a thread-pool executor). + + Args: + ohlcv_data: Validated OHLCV dict. + + Returns: + Indicator dict. 
+ """ + logger.debug("Computing technical indicators") + close = self._to_array(ohlcv_data["close"]) + high = self._to_array(ohlcv_data["high"]) + low = self._to_array(ohlcv_data["low"]) + + def to_list(arr: np.ndarray) -> list[float | None]: + return [None if np.isnan(v) else float(v) for v in arr] + + sma_results = { + f"sma_{p}": to_list(self._sma(close, p)) for p in self.sma_periods + } + ema_results = { + f"ema_{p}": to_list(self._ema(close, p)) for p in self.ema_periods + } + + upper_bb, mid_bb, lower_bb = self._bollinger_bands(close) + macd_line, signal, histogram = self._macd(close) + + result: dict[str, Any] = { + **sma_results, + **ema_results, + "rsi": to_list(self._rsi(close)), + "bollinger_bands": { + "upper": to_list(upper_bb), + "middle": to_list(mid_bb), + "lower": to_list(lower_bb), + }, + "macd": { + "macd": to_list(macd_line), + "signal": to_list(signal), + "histogram": to_list(histogram), + }, + "atr": to_list(self._atr(high, low, close)), + } + + logger.debug("Technical indicator computation complete") + return result diff --git a/vertical-ai/risk_management/__init__.py b/vertical-ai/risk_management/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/vertical-ai/risk_management/__pycache__/__init__.cpython-312.pyc b/vertical-ai/risk_management/__pycache__/__init__.cpython-312.pyc new file mode 100644 index 0000000..142076d Binary files /dev/null and b/vertical-ai/risk_management/__pycache__/__init__.cpython-312.pyc differ diff --git a/vertical-ai/risk_management/__pycache__/correlation_analyzer.cpython-312.pyc b/vertical-ai/risk_management/__pycache__/correlation_analyzer.cpython-312.pyc new file mode 100644 index 0000000..bf4df8a Binary files /dev/null and b/vertical-ai/risk_management/__pycache__/correlation_analyzer.cpython-312.pyc differ diff --git a/vertical-ai/risk_management/__pycache__/portfolio_risk.cpython-312.pyc b/vertical-ai/risk_management/__pycache__/portfolio_risk.cpython-312.pyc new file mode 100644 index 
0000000..a4595ef Binary files /dev/null and b/vertical-ai/risk_management/__pycache__/portfolio_risk.cpython-312.pyc differ diff --git a/vertical-ai/risk_management/__pycache__/position_sizer.cpython-312.pyc b/vertical-ai/risk_management/__pycache__/position_sizer.cpython-312.pyc new file mode 100644 index 0000000..ab395b0 Binary files /dev/null and b/vertical-ai/risk_management/__pycache__/position_sizer.cpython-312.pyc differ diff --git a/vertical-ai/risk_management/correlation_analyzer.py b/vertical-ai/risk_management/correlation_analyzer.py new file mode 100644 index 0000000..b93edd8 --- /dev/null +++ b/vertical-ai/risk_management/correlation_analyzer.py @@ -0,0 +1,219 @@ +"""Correlation analysis: rolling asset correlations and clustering. + +Provides :class:`CorrelationAnalyzer` for tracking pairwise and portfolio-level +correlation dynamics over time. +""" + +from __future__ import annotations + +from typing import Any + +import numpy as np +from loguru import logger + + +class CorrelationAnalyzer: + """Track rolling pairwise correlations between multiple assets. + + Uses a rolling window of period returns to compute Pearson correlation + matrices and derived statistics such as average correlation and + minimum-variance cluster identification. + + Attributes: + window: Rolling window size (number of periods). + min_periods: Minimum observations required before computing + correlation (defaults to half the window). + """ + + def __init__( + self, + window: int = 60, + min_periods: int | None = None, + ) -> None: + """Initialise CorrelationAnalyzer. + + Args: + window: Look-back window for rolling correlation. + min_periods: Minimum periods of data required. Defaults to + ``window // 2``. 
+ """ + if window < 2: + raise ValueError("window must be at least 2.") + self.window = window + self.min_periods = min_periods if min_periods is not None else window // 2 + + # ------------------------------------------------------------------ + # Private helpers + # ------------------------------------------------------------------ + + @staticmethod + def _validate_returns_matrix( + returns_matrix: Any, + ) -> tuple[np.ndarray, int, int]: + """Parse and validate the returns matrix. + + Args: + returns_matrix: Array-like of shape ``(n_periods, n_assets)``. + + Returns: + Tuple of (array, n_periods, n_assets). + + Raises: + ValueError: If input is not 2-D or has fewer than 2 assets. + """ + arr = np.asarray(returns_matrix, dtype=np.float64) + if arr.ndim != 2: + raise ValueError("returns_matrix must be 2-D (periods × assets).") + n_periods, n_assets = arr.shape + if n_assets < 2: + raise ValueError("At least 2 assets are required.") + return arr, n_periods, n_assets + + @staticmethod + def _pearson_corr(x: np.ndarray, y: np.ndarray) -> float: + """Compute Pearson correlation between two arrays. + + Args: + x: First array. + y: Second array. + + Returns: + Pearson r, or ``nan`` if undefined. + """ + if len(x) < 2: + return float("nan") + vx = x - np.mean(x) + vy = y - np.mean(y) + denom = np.sqrt(np.sum(vx ** 2) * np.sum(vy ** 2)) + if denom == 0: + return float("nan") + return float(np.sum(vx * vy) / denom) + + def _rolling_corr_pair( + self, + series_a: np.ndarray, + series_b: np.ndarray, + ) -> np.ndarray: + """Compute rolling Pearson correlation for a pair of series. + + Args: + series_a: Return series for asset A. + series_b: Return series for asset B. + + Returns: + Array of rolling correlations (NaN before min_periods). 
+ """ + n = len(series_a) + corrs = np.full(n, np.nan) + for i in range(n): + start = max(0, i - self.window + 1) + a_win = series_a[start: i + 1] + b_win = series_b[start: i + 1] + if len(a_win) >= self.min_periods: + corrs[i] = self._pearson_corr(a_win, b_win) + return corrs + + # ------------------------------------------------------------------ + # Public interface + # ------------------------------------------------------------------ + + def compute_correlation_matrix( + self, returns_matrix: Any + ) -> dict[str, Any]: + """Compute the full-sample correlation matrix. + + Args: + returns_matrix: Array-like of shape ``(n_periods, n_assets)``. + + Returns: + Dict with keys ``correlation_matrix`` (2-D list), + ``average_correlation`` (float), ``n_assets``, ``n_periods``. + """ + arr, n_periods, n_assets = self._validate_returns_matrix(returns_matrix) + + if n_periods < self.min_periods: + raise ValueError( + f"Need at least {self.min_periods} periods; got {n_periods}." + ) + + corr_mat = np.corrcoef(arr.T) + # Mask diagonal for average off-diagonal correlation + mask = ~np.eye(n_assets, dtype=bool) + avg_corr = float(np.nanmean(corr_mat[mask])) + + logger.debug(f"Correlation matrix: {n_assets}×{n_assets}, avg_corr={avg_corr:.4f}") + return { + "correlation_matrix": corr_mat.tolist(), + "average_correlation": avg_corr, + "n_assets": n_assets, + "n_periods": n_periods, + } + + def rolling_correlations( + self, + returns_matrix: Any, + asset_names: list[str] | None = None, + ) -> dict[str, Any]: + """Compute rolling pairwise correlations for all asset pairs. + + Args: + returns_matrix: Array-like of shape ``(n_periods, n_assets)``. + asset_names: Optional list of asset name strings. + + Returns: + Dict mapping ``"asset_i_vs_asset_j"`` strings to lists of rolling + correlation values. 
+ """ + arr, n_periods, n_assets = self._validate_returns_matrix(returns_matrix) + names = asset_names or [f"asset_{i}" for i in range(n_assets)] + + if len(names) != n_assets: + raise ValueError("asset_names length must match number of assets.") + + result: dict[str, list[float | None]] = {} + for i in range(n_assets): + for j in range(i + 1, n_assets): + key = f"{names[i]}_vs_{names[j]}" + corrs = self._rolling_corr_pair(arr[:, i], arr[:, j]) + result[key] = [None if np.isnan(v) else round(float(v), 6) for v in corrs] + + logger.debug(f"Rolling correlations computed for {len(result)} pairs") + return result + + def correlation_regime( + self, returns_matrix: Any + ) -> dict[str, Any]: + """Classify the current correlation regime. + + Computes recent vs historical average correlation to detect risk-on / + risk-off regime shifts. + + Args: + returns_matrix: Array-like of shape ``(n_periods, n_assets)``. + + Returns: + Dict with keys ``current_avg_corr``, ``historical_avg_corr``, + ``regime`` (``"high"``, ``"normal"``, or ``"low"``). + """ + arr, n_periods, n_assets = self._validate_returns_matrix(returns_matrix) + recent_n = min(self.window, n_periods) + + historical_corr_mat = np.corrcoef(arr.T) + recent_corr_mat = np.corrcoef(arr[-recent_n:].T) + + mask = ~np.eye(n_assets, dtype=bool) + hist_avg = float(np.nanmean(historical_corr_mat[mask])) + curr_avg = float(np.nanmean(recent_corr_mat[mask])) + + if curr_avg > 0.7: + regime = "high" + elif curr_avg < 0.3: + regime = "low" + else: + regime = "normal" + + return { + "current_avg_corr": round(curr_avg, 4), + "historical_avg_corr": round(hist_avg, 4), + "regime": regime, + } diff --git a/vertical-ai/risk_management/portfolio_risk.py b/vertical-ai/risk_management/portfolio_risk.py new file mode 100644 index 0000000..9562fe2 --- /dev/null +++ b/vertical-ai/risk_management/portfolio_risk.py @@ -0,0 +1,240 @@ +"""Portfolio risk: VaR, CVaR, and drawdown calculations. 
class PortfolioRisk:
    """Portfolio-level risk metrics derived from a return time series.

    Offers Value-at-Risk and Conditional Value-at-Risk under either the
    empirical (historical-simulation) or Gaussian (parametric) approach,
    plus peak-to-trough drawdown statistics and a combined risk report.

    Attributes:
        confidence_level: Confidence level for VaR / CVaR (e.g., 0.95).
        method: ``"historical"`` or ``"parametric"``.
        annualisation_factor: Trading periods per year used for annualised
            metrics.
    """

    def __init__(
        self,
        confidence_level: float = 0.95,
        method: str = "historical",
        annualisation_factor: int = 252,
    ) -> None:
        """Configure the risk engine.

        Args:
            confidence_level: Statistical confidence level (0 < cl < 1).
            method: ``"historical"`` for empirical distribution or
                ``"parametric"`` for Gaussian approximation.
            annualisation_factor: Number of periods in a year.

        Raises:
            ValueError: If confidence_level or method are invalid.
        """
        if not 0 < confidence_level < 1:
            raise ValueError("confidence_level must be in (0, 1).")
        if method not in ("historical", "parametric"):
            raise ValueError("method must be 'historical' or 'parametric'.")
        self.confidence_level = confidence_level
        self.method = method
        self.annualisation_factor = annualisation_factor

    # ------------------------------------------------------------------
    # Private helpers
    # ------------------------------------------------------------------

    @staticmethod
    def _validate_returns(returns: Any) -> np.ndarray:
        """Flatten *returns* to a float64 vector and check its length.

        Args:
            returns: Array-like of period returns.

        Returns:
            Validated 1-D float64 array.

        Raises:
            ValueError: If fewer than 2 observations are supplied.
        """
        series = np.asarray(returns, dtype=np.float64).ravel()
        if series.size < 2:
            raise ValueError("returns must have at least 2 observations.")
        return series

    def _var_historical(self, returns: np.ndarray) -> float:
        """Empirical-percentile VaR (positive number = loss)."""
        tail_pct = (1 - self.confidence_level) * 100
        return float(-np.percentile(returns, tail_pct))

    def _var_parametric(self, returns: np.ndarray) -> float:
        """Gaussian VaR from sample mean and std (positive number = loss)."""
        mean = float(np.mean(returns))
        stdev = float(np.std(returns, ddof=1))
        quantile = stats.norm.ppf(1 - self.confidence_level)
        return float(-(mean + quantile * stdev))

    def _cvar_historical(self, returns: np.ndarray) -> float:
        """Empirical CVaR: mean loss beyond the VaR percentile."""
        threshold = np.percentile(returns, (1 - self.confidence_level) * 100)
        losses = returns[returns <= threshold]
        if len(losses) == 0:
            return 0.0
        return float(-np.mean(losses))

    def _cvar_parametric(self, returns: np.ndarray) -> float:
        """Gaussian CVaR via the closed-form expected-shortfall formula."""
        mean = float(np.mean(returns))
        stdev = float(np.std(returns, ddof=1))
        alpha = 1 - self.confidence_level
        quantile = stats.norm.ppf(alpha)
        return float(-(mean + stdev * stats.norm.pdf(quantile) / alpha))

    @staticmethod
    def _drawdown_series(cumulative_returns: np.ndarray) -> np.ndarray:
        """Drawdown at each point relative to the running peak.

        Args:
            cumulative_returns: Cumulative return series (wealth index).

        Returns:
            Drawdown array (non-positive values).
        """
        peaks = np.maximum.accumulate(cumulative_returns)
        # Epsilon keeps the ratio defined if the peak were ever zero.
        return (cumulative_returns - peaks) / (peaks + 1e-9)

    # ------------------------------------------------------------------
    # Public interface
    # ------------------------------------------------------------------

    def compute_var(self, returns: Any) -> float:
        """Compute Value-at-Risk.

        Args:
            returns: Array-like of period returns.

        Returns:
            VaR (positive = potential loss).
        """
        series = self._validate_returns(returns)
        if self.method == "parametric":
            return self._var_parametric(series)
        return self._var_historical(series)

    def compute_cvar(self, returns: Any) -> float:
        """Compute Conditional Value-at-Risk (Expected Shortfall).

        Args:
            returns: Array-like of period returns.

        Returns:
            CVaR (positive = expected loss beyond VaR threshold).
        """
        series = self._validate_returns(returns)
        if self.method == "parametric":
            return self._cvar_parametric(series)
        return self._cvar_historical(series)

    def compute_drawdowns(self, returns: Any) -> dict[str, float]:
        """Compute drawdown metrics from a return series.

        Args:
            returns: Array-like of period returns.

        Returns:
            Dict with keys ``max_drawdown``, ``avg_drawdown``,
            ``current_drawdown``, ``drawdown_duration`` (in periods).
        """
        series = self._validate_returns(returns)
        wealth = np.cumprod(1 + series)
        dd = self._drawdown_series(wealth)
        underwater = dd < 0

        # Longest consecutive run of underwater periods.
        longest = 0
        streak = 0
        for flag in underwater:
            streak = streak + 1 if flag else 0
            longest = max(longest, streak)

        return {
            "max_drawdown": float(np.min(dd)),
            "avg_drawdown": float(np.mean(dd[underwater])) if underwater.any() else 0.0,
            "current_drawdown": float(dd[-1]),
            "drawdown_duration": longest,
        }

    def full_risk_report(self, returns: Any) -> dict[str, Any]:
        """Generate a full risk report for a return series.

        Args:
            returns: Array-like of period returns.

        Returns:
            Dict containing VaR, CVaR, drawdown metrics, volatility, and
            annualised Sharpe ratio (assuming zero risk-free rate).
        """
        series = self._validate_returns(returns)
        logger.debug(f"Computing full risk report for {len(series)} returns")

        var_value = self.compute_var(series)
        cvar_value = self.compute_cvar(series)
        drawdowns = self.compute_drawdowns(series)

        ann_vol = float(np.std(series, ddof=1)) * np.sqrt(self.annualisation_factor)
        ann_return = float(np.mean(series)) * self.annualisation_factor
        sharpe = ann_return / ann_vol if ann_vol > 0 else 0.0

        return {
            "var": var_value,
            "cvar": cvar_value,
            **drawdowns,
            "annualised_volatility": ann_vol,
            "annualised_return": ann_return,
            "sharpe_ratio": sharpe,
            "confidence_level": self.confidence_level,
            "method": self.method,
        }
class PositionSizer:
    """Compute optimal position sizes using multiple sizing methodologies.

    Implements:

    * **Kelly Criterion** – maximises expected logarithmic growth.
    * **Fixed Fraction** – simple risk-per-trade percentage.
    * **Volatility Targeting** – size inversely proportional to asset vol.

    Attributes:
        max_position_fraction: Hard cap on any single position as a fraction
            of portfolio equity (0 < cap ≤ 1).
        annualisation_factor: Trading periods per year for volatility scaling.
    """

    def __init__(
        self,
        max_position_fraction: float = 0.25,
        annualisation_factor: int = 252,
    ) -> None:
        """Initialise PositionSizer.

        Args:
            max_position_fraction: Maximum fraction of capital for any single
                position.
            annualisation_factor: Used to annualise daily volatility.

        Raises:
            ValueError: If max_position_fraction is outside (0, 1].
        """
        if not 0 < max_position_fraction <= 1:
            raise ValueError("max_position_fraction must be in (0, 1].")
        self.max_position_fraction = max_position_fraction
        self.annualisation_factor = annualisation_factor

    # ------------------------------------------------------------------
    # Private helpers
    # ------------------------------------------------------------------

    def _cap(self, fraction: float) -> float:
        """Apply the maximum position fraction cap.

        Args:
            fraction: Raw computed position fraction.

        Returns:
            Fraction clipped into [0, max_position_fraction]; negative
            inputs are floored at 0.
        """
        return float(np.clip(fraction, 0.0, self.max_position_fraction))

    # ------------------------------------------------------------------
    # Public interface
    # ------------------------------------------------------------------

    def kelly_criterion(
        self,
        win_rate: float,
        win_loss_ratio: float,
        kelly_fraction: float = 1.0,
    ) -> float:
        """Compute Kelly-optimal position fraction.

        Uses the simplified discrete Kelly formula:
        ``f* = (p * b - q) / b`` where *p* is the win probability, *b* is the
        win/loss ratio, and *q = 1 - p*.

        Args:
            win_rate: Probability of a winning trade (0 < p < 1).
            win_loss_ratio: Average win divided by average loss (b > 0).
            kelly_fraction: Fractional Kelly multiplier to reduce variance
                (commonly 0.25–0.5 in practice).

        Returns:
            Optimal position size as fraction of capital; negative raw Kelly
            values (negative edge) are floored at 0.

        Raises:
            ValueError: If inputs are out of range.
        """
        if not 0 < win_rate < 1:
            raise ValueError("win_rate must be in (0, 1).")
        if win_loss_ratio <= 0:
            raise ValueError("win_loss_ratio must be positive.")
        if not 0 < kelly_fraction <= 1:
            raise ValueError("kelly_fraction must be in (0, 1].")

        p = win_rate
        q = 1.0 - p
        b = win_loss_ratio
        raw_kelly = (p * b - q) / b
        adjusted = raw_kelly * kelly_fraction

        # Never take a short/negative position from a negative edge; cap at
        # the portfolio-wide maximum.
        result = self._cap(max(adjusted, 0.0))
        logger.debug(f"Kelly: raw={raw_kelly:.4f}, adjusted={adjusted:.4f}, capped={result:.4f}")
        return result

    def fixed_fraction(
        self,
        risk_per_trade: float,
        stop_loss_pct: float,
        capital: float,
        price: float,
    ) -> dict[str, float]:
        """Compute fixed-fraction position size from a stop-loss percentage.

        Position size is calculated as:
        ``n_shares = (capital × risk_fraction) / (price × stop_loss_pct)``

        Args:
            risk_per_trade: Fraction of capital to risk per trade (e.g., 0.01).
            stop_loss_pct: Stop-loss distance as fraction of price (e.g., 0.02).
            capital: Total portfolio capital in currency units.
            price: Current asset price in currency units.

        Returns:
            Dict with keys ``position_fraction``, ``shares``, ``risk_amount``.

        Raises:
            ValueError: If risk_per_trade is outside (0, 1], or if
                stop_loss_pct or price is zero or negative.
        """
        # Reject nonsensical risk budgets up front: 0 or negative would
        # silently produce zero/negative share counts downstream.
        if not 0 < risk_per_trade <= 1:
            raise ValueError("risk_per_trade must be in (0, 1].")
        if stop_loss_pct <= 0:
            raise ValueError("stop_loss_pct must be positive.")
        if price <= 0:
            raise ValueError("price must be positive.")

        risk_amount = capital * risk_per_trade
        shares = risk_amount / (price * stop_loss_pct)
        position_value = shares * price
        position_fraction = self._cap(position_value / capital if capital > 0 else 0.0)
        # Re-scale shares if the fraction was capped
        actual_shares = (position_fraction * capital) / price

        logger.debug(
            f"Fixed-fraction: risk={risk_amount:.2f}, shares={actual_shares:.4f}, "
            f"fraction={position_fraction:.4f}"
        )
        return {
            "position_fraction": position_fraction,
            "shares": actual_shares,
            "risk_amount": risk_amount,
        }

    def volatility_targeting(
        self,
        returns: Any,
        target_volatility: float,
        capital: float,
        price: float,
    ) -> dict[str, float]:
        """Compute position size to achieve a target annualised volatility.

        Position fraction = ``target_vol / asset_annualised_vol``.

        Args:
            returns: Array-like of recent period returns for the asset.
            target_volatility: Target annualised portfolio volatility
                (must be non-negative).
            capital: Total portfolio capital.
            price: Current asset price.

        Returns:
            Dict with keys ``position_fraction``, ``shares``,
            ``asset_volatility``.

        Raises:
            ValueError: If returns array is too short or target_volatility
                is negative.
        """
        # A negative vol target is a caller error; previously it was
        # silently clipped to a zero position.
        if target_volatility < 0:
            raise ValueError("target_volatility must be non-negative.")

        arr = np.asarray(returns, dtype=np.float64).ravel()
        if arr.size < 2:
            raise ValueError("returns must have at least 2 observations.")

        # Sample (ddof=1) volatility, annualised by sqrt of periods/year.
        daily_vol = float(np.std(arr, ddof=1))
        ann_vol = daily_vol * np.sqrt(self.annualisation_factor)

        if ann_vol == 0:
            logger.warning("Asset volatility is zero; defaulting to max fraction.")
            fraction = self.max_position_fraction
        else:
            fraction = self._cap(target_volatility / ann_vol)

        shares = (fraction * capital) / price if price > 0 else 0.0

        logger.debug(
            f"Vol-targeting: ann_vol={ann_vol:.4f}, target={target_volatility:.4f}, "
            f"fraction={fraction:.4f}"
        )
        return {
            "position_fraction": fraction,
            "shares": shares,
            "asset_volatility": ann_vol,
        }