From f055c21e3d832a9e821fd73458134b1e37cd3eb5 Mon Sep 17 00:00:00 2001
From: Imran Siddique <imran.siddique@microsoft.com>
Date: Thu, 5 Feb 2026 14:18:50 -0800
Subject: [PATCH 1/4] [Contrib] Agent-OS Governance Module

Adds kernel-level governance for CrewAI workflows.

Features:
- GovernancePolicy: Define rules for crew behavior
- GovernedAgent: Wrap individual agents with policy enforcement
- GovernedCrew: Govern entire crews with shared policy
- Content filtering with blocked patterns
- Tool filtering (blocked/allowed lists)
- Full audit trail

Integration with Agent-OS kernel for enterprise governance.

See: https://github.com/imran-siddique/agent-os
---
 src/crewai/governance/README.md   | 161 +++++++++++
 src/crewai/governance/__init__.py |  20 ++
 src/crewai/governance/_kernel.py  | 431 ++++++++++++++++++++++++++++++
 3 files changed, 612 insertions(+)
 create mode 100644 src/crewai/governance/README.md
 create mode 100644 src/crewai/governance/__init__.py
 create mode 100644 src/crewai/governance/_kernel.py

diff --git a/src/crewai/governance/README.md b/src/crewai/governance/README.md
new file mode 100644
index 0000000000..22270fee74
--- /dev/null
+++ b/src/crewai/governance/README.md
@@ -0,0 +1,161 @@
+# Agent-OS Governance for CrewAI
+
+Kernel-level policy enforcement for CrewAI workflows using [Agent-OS](https://github.com/imran-siddique/agent-os).
+
+## Features
+
+- **Policy Enforcement**: Define rules for agent behavior within crews
+- **Tool Filtering**: Control which tools agents can use
+- **Content Filtering**: Block dangerous patterns in outputs
+- **Rate Limiting**: Limit iterations and tool calls
+- **Audit Trail**: Full logging of all crew activities
+
+## Installation
+
+```bash
+pip install crewai[governance]
+# or
+pip install agent-os-kernel
+```
+
+## Quick Start
+
+```python
+from crewai import Agent, Crew, Task
+from crewai.governance import GovernedCrew, GovernancePolicy
+
+# Create policy
+policy = GovernancePolicy(
+    max_tool_calls=20,
+    max_iterations=15,
+    blocked_patterns=["DROP TABLE", "rm -rf", "DELETE FROM"],
+    blocked_tools=["shell_tool"],
+)
+
+# Create agents
+researcher = Agent(
+    role="Researcher",
+    goal="Find accurate information",
+    backstory="Expert researcher",
+)
+
+writer = Agent(
+    role="Writer",
+    goal="Write clear reports",
+    backstory="Technical writer",
+)
+
+# Create tasks
+research_task = Task(
+    description="Research AI governance",
+    agent=researcher,
+)
+
+write_task = Task(
+    description="Write summary report",
+    agent=writer,
+)
+
+# Create crew
+crew = Crew(
+    agents=[researcher, writer],
+    tasks=[research_task, write_task],
+)
+
+# Govern the crew
+governed_crew = GovernedCrew(crew, policy)
+
+# Execute with governance
+result = governed_crew.kickoff()
+
+# Check for violations
+print(f"Violations: {len(governed_crew.violations)}")
+print(f"Audit events: {len(governed_crew.audit_log)}")
+```
+
+## Policy Options
+
+```python
+GovernancePolicy(
+    # Limits
+    max_tool_calls=50,       # Max tool invocations per task
+    max_iterations=25,       # Max agent iterations
+    max_execution_time=600,  # Max seconds for entire crew
+    
+    # Tool Control
+    allowed_tools=["search", "calculator"],  # Whitelist
+    blocked_tools=["shell_tool", "file_delete"],  # Blacklist
+    
+    # Content Filtering
+    blocked_patterns=["DROP TABLE", "rm -rf"],
+    max_output_length=100_000,
+    
+    # Approval
+    require_human_approval=False,
+    approval_tools=["database_write"],
+    
+    # Audit
+    log_all_actions=True,
+)
+```
+
+## Handling Violations
+
+```python
+def on_violation(violation):
+    print(f"BLOCKED: {violation.policy_name}")
+    print(f"  Agent: {violation.agent_name}")
+    print(f"  Reason: {violation.description}")
+    # Send alert, log to SIEM, etc.
+
+governed_crew = GovernedCrew(
+    crew=crew,
+    policy=policy,
+    on_violation=on_violation,
+)
+```
+
+## Audit Trail
+
+```python
+# Get detailed audit log
+for event in governed_crew.audit_log:
+    print(f"{event.timestamp}: {event.event_type}")
+    if event.agent_name:
+        print(f"  Agent: {event.agent_name}")
+    print(f"  Details: {event.details}")
+
+# Get summary
+summary = governed_crew.get_audit_summary()
+print(f"Total violations: {summary['total_violations']}")
+print(f"Violations by type: {summary['violations_by_type']}")
+```
+
+## Integration with Agent-OS Kernel
+
+For full kernel-level governance:
+
+```python
+from agent_os import KernelSpace
+from agent_os.policies import SQLPolicy, CostControlPolicy
+from crewai.governance import GovernedCrew
+
+# Create kernel with policies
+kernel = KernelSpace(policy=[
+    SQLPolicy(allow=["SELECT"], deny=["DROP", "DELETE"]),
+    CostControlPolicy(max_cost_usd=100),
+])
+
+# Wrap crew execution in kernel
+@kernel.register
+async def run_crew(inputs):
+    return governed_crew.kickoff(inputs=inputs)
+
+# Execute with full governance
+result = await kernel.execute(run_crew, {"topic": "AI safety"})
+```
+
+## Links
+
+- [Agent-OS GitHub](https://github.com/imran-siddique/agent-os)
+- [CrewAI Documentation](https://docs.crewai.com)
diff --git a/src/crewai/governance/__init__.py b/src/crewai/governance/__init__.py
new file mode 100644
index 0000000000..c5ca30b405
--- /dev/null
+++ b/src/crewai/governance/__init__.py
@@ -0,0 +1,20 @@
+# Copyright (c) Agent-OS Contributors. All rights reserved.
+# Licensed under the MIT License.
+"""Agent-OS Governance for CrewAI.
+
+Provides kernel-level policy enforcement for CrewAI workflows.
+"""
+
+from ._kernel import (
+    GovernancePolicy,
+    GovernedAgent,
+    GovernedCrew,
+    PolicyViolation,
+)
+
+__all__ = [
+    "GovernancePolicy",
+    "GovernedAgent",
+    "GovernedCrew",
+    "PolicyViolation",
+]
diff --git a/src/crewai/governance/_kernel.py b/src/crewai/governance/_kernel.py
new file mode 100644
index 0000000000..fbb4ef8747
--- /dev/null
+++ b/src/crewai/governance/_kernel.py
@@ -0,0 +1,431 @@
+# Copyright (c) Agent-OS Contributors. All rights reserved.
+# Licensed under the MIT License.
+"""Kernel-level governance for CrewAI agents and crews."""
+
+from __future__ import annotations
+
+import re
+import time
+from dataclasses import dataclass, field
+from datetime import datetime, timezone
+from enum import Enum
+from functools import wraps
+from typing import Any, Callable, Dict, List, Optional, Set
+
+try:
+    from crewai import Agent, Crew, Task
+except ImportError:
+    Agent = Any
+    Crew = Any
+    Task = Any
+
+
+class ViolationType(Enum):
+    """Types of policy violations."""
+
+    TOOL_BLOCKED = "tool_blocked"
+    TOOL_LIMIT_EXCEEDED = "tool_limit_exceeded"
+    MESSAGE_BLOCKED = "message_blocked"
+    MESSAGE_LIMIT_EXCEEDED = "message_limit_exceeded"
+    TIMEOUT = "timeout"
+    CONTENT_FILTERED = "content_filtered"
+
+
+@dataclass
+class PolicyViolation:
+    """Represents a policy violation event."""
+
+    violation_type: ViolationType
+    policy_name: str
+    description: str
+    timestamp: datetime = field(default_factory=lambda: datetime.now(timezone.utc))
+    agent_name: Optional[str] = None
+    task_name: Optional[str] = None
+    details: Dict[str, Any] = field(default_factory=dict)
+
+
+@dataclass
+class AuditEvent:
+    """Audit trail event."""
+
+    event_type: str
+    timestamp: datetime
+    agent_name: Optional[str]
+    task_name: Optional[str]
+    details: Dict[str, Any]
+
+
+@dataclass
+class GovernancePolicy:
+    """Policy configuration for crew governance.
+
+    Attributes:
+        max_tool_calls: Maximum tool invocations per task.
+        max_iterations: Maximum agent iterations per task.
+        max_execution_time: Maximum seconds per task.
+        blocked_patterns: Regex patterns to block in outputs.
+        blocked_tools: Tools that cannot be used.
+        allowed_tools: If set, only these tools can be used.
+        require_human_approval: Require approval for certain actions.
+        approval_tools: Tools requiring human approval.
+        log_all_actions: Log all agent actions.
+        max_output_length: Maximum output length in characters.
+    """
+
+    max_tool_calls: int = 50
+    max_iterations: int = 25
+    max_execution_time: int = 600
+    blocked_patterns: List[str] = field(default_factory=list)
+    blocked_tools: List[str] = field(default_factory=list)
+    allowed_tools: Optional[List[str]] = None
+    require_human_approval: bool = False
+    approval_tools: List[str] = field(default_factory=list)
+    log_all_actions: bool = True
+    max_output_length: int = 100_000
+
+    def __post_init__(self):
+        """Compile regex patterns."""
+        self._compiled_patterns = [
+            re.compile(p, re.IGNORECASE) for p in self.blocked_patterns
+        ]
+
+
+class GovernedAgent:
+    """Wraps a CrewAI Agent with governance policies.
+
+    Example:
+        ```python
+        from crewai import Agent
+        from crewai.governance import GovernedAgent, GovernancePolicy
+
+        policy = GovernancePolicy(
+            max_tool_calls=10,
+            blocked_tools=["shell_tool"],
+        )
+
+        researcher = Agent(
+            role="Researcher",
+            goal="Find information",
+            backstory="Expert researcher",
+        )
+
+        governed_researcher = GovernedAgent(researcher, policy)
+        ```
+    """
+
+    def __init__(
+        self,
+        agent: Agent,
+        policy: GovernancePolicy,
+        on_violation: Optional[Callable[[PolicyViolation], None]] = None,
+    ):
+        """Initialize governed agent.
+
+        Args:
+            agent: The CrewAI agent to govern.
+            policy: Governance policy to enforce.
+            on_violation: Callback when violations occur.
+        """
+        self.agent = agent
+        self.policy = policy
+        self.on_violation = on_violation
+        self._tool_calls = 0
+        self._iterations = 0
+        self._start_time: Optional[float] = None
+        self._violations: List[PolicyViolation] = []
+        self._audit_log: List[AuditEvent] = []
+
+        # Wrap agent's execute method
+        self._wrap_execution()
+
+    def _wrap_execution(self):
+        """Wrap the agent's execution to add governance."""
+        original_execute = getattr(self.agent, "execute_task", None)
+        if original_execute is None:
+            return
+
+        @wraps(original_execute)
+        def governed_execute(task: Any, context: Optional[str] = None, tools: Optional[List] = None):
+            self._start_time = time.time()
+            self._tool_calls = 0
+            self._iterations = 0
+
+            # Filter tools based on policy
+            if tools:
+                tools = self._filter_tools(tools)
+
+            # Execute with governance
+            try:
+                result = original_execute(task, context, tools)
+                # Check output for violations
+                result = self._check_output(result, task)
+                return result
+            finally:
+                self._log_event("task_completed", task=task)
+
+        self.agent.execute_task = governed_execute
+
+    def _filter_tools(self, tools: List[Any]) -> List[Any]:
+        """Filter tools based on policy."""
+        filtered = []
+        for tool in tools:
+            tool_name = getattr(tool, "name", str(tool))
+
+            # Check blocked list
+            if tool_name in self.policy.blocked_tools:
+                self._record_violation(
+                    ViolationType.TOOL_BLOCKED,
+                    f"Tool '{tool_name}' is blocked by policy",
+                    tool_name=tool_name,
+                )
+                continue
+
+            # Check allowed list
+            if (
+                self.policy.allowed_tools is not None
+                and tool_name not in self.policy.allowed_tools
+            ):
+                self._record_violation(
+                    ViolationType.TOOL_BLOCKED,
+                    f"Tool '{tool_name}' not in allowed list",
+                    tool_name=tool_name,
+                )
+                continue
+
+            filtered.append(tool)
+
+        return filtered
+
+    def _check_output(self, output: Any, task: Any) -> Any:
+        """Check output for policy violations."""
+        if output is None:
+            return output
+
+        output_str = str(output)
+
+        # Check length
+        if len(output_str) > self.policy.max_output_length:
+            self._record_violation(
+                ViolationType.CONTENT_FILTERED,
+                f"Output exceeds max length ({len(output_str)} > {self.policy.max_output_length})",
+            )
+            output_str = output_str[: self.policy.max_output_length]
+
+        # Check patterns
+        for pattern in self.policy._compiled_patterns:
+            if pattern.search(output_str):
+                self._record_violation(
+                    ViolationType.CONTENT_FILTERED,
+                    f"Output contains blocked pattern: {pattern.pattern}",
+                    pattern=pattern.pattern,
+                )
+                output_str = pattern.sub("[BLOCKED]", output_str)
+
+        return output_str if isinstance(output, str) else output
+
+    def _record_violation(
+        self,
+        violation_type: ViolationType,
+        description: str,
+        **details: Any,
+    ):
+        """Record a policy violation."""
+        violation = PolicyViolation(
+            violation_type=violation_type,
+            policy_name=violation_type.value,
+            description=description,
+            agent_name=getattr(self.agent, "role", "unknown"),
+            details=details,
+        )
+        self._violations.append(violation)
+
+        if self.on_violation:
+            self.on_violation(violation)
+
+        self._log_event(
+            "violation",
+            violation_type=violation_type.value,
+            description=description,
+        )
+
+    def _log_event(self, event_type: str, **details: Any):
+        """Log an audit event."""
+        if not self.policy.log_all_actions:
+            return
+
+        event = AuditEvent(
+            event_type=event_type,
+            timestamp=datetime.now(timezone.utc),
+            agent_name=getattr(self.agent, "role", "unknown"),
+            task_name=details.get("task_name"),
+            details=details,
+        )
+        self._audit_log.append(event)
+
+    @property
+    def violations(self) -> List[PolicyViolation]:
+        """Get all violations."""
+        return self._violations.copy()
+
+    @property
+    def audit_log(self) -> List[AuditEvent]:
+        """Get audit log."""
+        return self._audit_log.copy()
+
+
+class GovernedCrew:
+    """Wraps a CrewAI Crew with governance policies.
+
+    Example:
+        ```python
+        from crewai import Agent, Crew, Task
+        from crewai.governance import GovernedCrew, GovernancePolicy
+
+        policy = GovernancePolicy(
+            max_tool_calls=20,
+            max_iterations=15,
+            blocked_patterns=["DROP TABLE", "rm -rf"],
+        )
+
+        crew = Crew(
+            agents=[researcher, writer],
+            tasks=[research_task, write_task],
+        )
+
+        governed_crew = GovernedCrew(crew, policy)
+        result = governed_crew.kickoff()
+        print(f"Violations: {len(governed_crew.violations)}")
+        ```
+    """
+
+    def __init__(
+        self,
+        crew: Crew,
+        policy: GovernancePolicy,
+        on_violation: Optional[Callable[[PolicyViolation], None]] = None,
+    ):
+        """Initialize governed crew.
+
+        Args:
+            crew: The CrewAI crew to govern.
+            policy: Governance policy to enforce.
+            on_violation: Callback when violations occur.
+        """
+        self.crew = crew
+        self.policy = policy
+        self.on_violation = on_violation
+        self._violations: List[PolicyViolation] = []
+        self._audit_log: List[AuditEvent] = []
+        self._governed_agents: List[GovernedAgent] = []
+
+        # Wrap all agents
+        self._wrap_agents()
+
+    def _wrap_agents(self):
+        """Wrap all crew agents with governance."""
+        for i, agent in enumerate(self.crew.agents):
+            governed = GovernedAgent(agent, self.policy, self._handle_violation)
+            self._governed_agents.append(governed)
+            # Note: agents are already wrapped in place
+
+    def _handle_violation(self, violation: PolicyViolation):
+        """Handle violations from governed agents."""
+        self._violations.append(violation)
+        if self.on_violation:
+            self.on_violation(violation)
+
+    def kickoff(self, inputs: Optional[Dict[str, Any]] = None) -> Any:
+        """Execute the crew with governance.
+
+        Args:
+            inputs: Optional inputs for the crew.
+
+        Returns:
+            Crew execution result.
+        """
+        self._log_event("crew_started", inputs=inputs)
+        start_time = time.time()
+
+        try:
+            result = self.crew.kickoff(inputs=inputs)
+
+            # Check execution time
+            elapsed = time.time() - start_time
+            if elapsed > self.policy.max_execution_time:
+                self._record_violation(
+                    ViolationType.TIMEOUT,
+                    f"Execution time ({elapsed:.1f}s) exceeded limit ({self.policy.max_execution_time}s)",
+                )
+
+            return result
+        finally:
+            self._log_event(
+                "crew_completed",
+                duration=time.time() - start_time,
+                violations=len(self._violations),
+            )
+
+    def _record_violation(
+        self,
+        violation_type: ViolationType,
+        description: str,
+        **details: Any,
+    ):
+        """Record a crew-level violation."""
+        violation = PolicyViolation(
+            violation_type=violation_type,
+            policy_name=violation_type.value,
+            description=description,
+            details=details,
+        )
+        self._violations.append(violation)
+
+        if self.on_violation:
+            self.on_violation(violation)
+
+    def _log_event(self, event_type: str, **details: Any):
+        """Log audit event."""
+        if not self.policy.log_all_actions:
+            return
+
+        event = AuditEvent(
+            event_type=event_type,
+            timestamp=datetime.now(timezone.utc),
+            agent_name=None,
+            task_name=None,
+            details=details,
+        )
+        self._audit_log.append(event)
+
+    @property
+    def violations(self) -> List[PolicyViolation]:
+        """Get all violations from crew and agents."""
+        all_violations = self._violations.copy()
+        for agent in self._governed_agents:
+            all_violations.extend(agent.violations)
+        return all_violations
+
+    @property
+    def audit_log(self) -> List[AuditEvent]:
+        """Get full audit log."""
+        all_events = self._audit_log.copy()
+        for agent in self._governed_agents:
+            all_events.extend(agent.audit_log)
+        return sorted(all_events, key=lambda e: e.timestamp)
+
+    def get_audit_summary(self) -> Dict[str, Any]:
+        """Get summary of governance audit."""
+        return {
+            "total_violations": len(self.violations),
+            "violations_by_type": self._count_by_type(),
+            "total_events": len(self.audit_log),
+            "agents": [a.agent.role for a in self._governed_agents],
+        }
+
+    def _count_by_type(self) -> Dict[str, int]:
+        """Count violations by type."""
+        counts: Dict[str, int] = {}
+        for v in self.violations:
+            key = v.violation_type.value
+            counts[key] = counts.get(key, 0) + 1
+        return counts

From b8fda27dad126250e1428d5748e896e710cd86c0 Mon Sep 17 00:00:00 2001
From: Imran Siddique <imran.siddique@microsoft.com>
Date: Thu, 5 Feb 2026 14:36:59 -0800
Subject: [PATCH 2/4] fix: Address review comments

- Fix content filtering bypass for non-string outputs
- Fix double-counting of agent violations in crew totals
- Remove unimplemented human approval features from docs
- Add warning when agent lacks execute_task method
- Use getattr consistently for agent.role access
- Clarify rate limiting requires CrewAI callback integration
---
 src/crewai/governance/README.md  | 10 ++-----
 src/crewai/governance/_kernel.py | 49 ++++++++++++++++++++++++--------
 2 files changed, 40 insertions(+), 19 deletions(-)

diff --git a/src/crewai/governance/README.md b/src/crewai/governance/README.md
index 22270fee74..fa7425e6ff 100644
--- a/src/crewai/governance/README.md
+++ b/src/crewai/governance/README.md
@@ -77,23 +77,19 @@ print(f"Audit events: {len(governed_crew.audit_log)}")
 
 ```python
 GovernancePolicy(
-    # Limits
+    # Limits (tracked, enforcement requires CrewAI callbacks)
     max_tool_calls=50,       # Max tool invocations per task
     max_iterations=25,       # Max agent iterations
     max_execution_time=600,  # Max seconds for entire crew
     
-    # Tool Control
+    # Tool Control (enforced via tool filtering)
     allowed_tools=["search", "calculator"],  # Whitelist
     blocked_tools=["shell_tool", "file_delete"],  # Blacklist
     
-    # Content Filtering
+    # Content Filtering (enforced on outputs)
     blocked_patterns=["DROP TABLE", "rm -rf"],
     max_output_length=100_000,
     
-    # Approval
-    require_human_approval=False,
-    approval_tools=["database_write"],
-    
     # Audit
     log_all_actions=True,
 )
diff --git a/src/crewai/governance/_kernel.py b/src/crewai/governance/_kernel.py
index fbb4ef8747..2db4f04607 100644
--- a/src/crewai/governance/_kernel.py
+++ b/src/crewai/governance/_kernel.py
@@ -66,10 +66,12 @@ class GovernancePolicy:
         blocked_patterns: Regex patterns to block in outputs.
         blocked_tools: Tools that cannot be used.
         allowed_tools: If set, only these tools can be used.
-        require_human_approval: Require approval for certain actions.
-        approval_tools: Tools requiring human approval.
         log_all_actions: Log all agent actions.
         max_output_length: Maximum output length in characters.
+        
+    Note:
+        max_tool_calls and max_iterations are tracked but enforcement
+        requires CrewAI callback integration (future enhancement).
     """
 
     max_tool_calls: int = 50
@@ -78,8 +80,6 @@ class GovernancePolicy:
     blocked_patterns: List[str] = field(default_factory=list)
     blocked_tools: List[str] = field(default_factory=list)
     allowed_tools: Optional[List[str]] = None
-    require_human_approval: bool = False
-    approval_tools: List[str] = field(default_factory=list)
     log_all_actions: bool = True
     max_output_length: int = 100_000
 
@@ -140,8 +140,17 @@ def __init__(
 
     def _wrap_execution(self):
         """Wrap the agent's execution to add governance."""
+        import logging
+        logger = logging.getLogger(__name__)
+        
         original_execute = getattr(self.agent, "execute_task", None)
         if original_execute is None:
+            agent_name = getattr(self.agent, "role", "unknown")
+            logger.warning(
+                "GovernedAgent: Agent '%s' lacks 'execute_task' method. "
+                "Governance will NOT be applied to this agent.",
+                agent_name,
+            )
             return
 
         @wraps(original_execute)
@@ -197,11 +206,17 @@ def _filter_tools(self, tools: List[Any]) -> List[Any]:
         return filtered
 
     def _check_output(self, output: Any, task: Any) -> Any:
-        """Check output for policy violations."""
+        """Check output for policy violations.
+        
+        Note: For non-string outputs, violations are detected and logged,
+        but the original object is returned. To fully sanitize complex
+        objects, serialize them first.
+        """
         if output is None:
             return output
 
         output_str = str(output)
+        was_modified = False
 
         # Check length
         if len(output_str) > self.policy.max_output_length:
@@ -210,6 +225,7 @@ def _check_output(self, output: Any, task: Any) -> Any:
                 f"Output exceeds max length ({len(output_str)} > {self.policy.max_output_length})",
             )
             output_str = output_str[: self.policy.max_output_length]
+            was_modified = True
 
         # Check patterns
         for pattern in self.policy._compiled_patterns:
@@ -220,8 +236,15 @@ def _check_output(self, output: Any, task: Any) -> Any:
                     pattern=pattern.pattern,
                 )
                 output_str = pattern.sub("[BLOCKED]", output_str)
+                was_modified = True
 
-        return output_str if isinstance(output, str) else output
+        # Return sanitized string, or log warning for non-string outputs
+        if isinstance(output, str):
+            return output_str
+        elif was_modified:
+            # Non-string output with violations - return sanitized string representation
+            return output_str
+        return output
 
     def _record_violation(
         self,
@@ -399,11 +422,13 @@ def _log_event(self, event_type: str, **details: Any):
 
     @property
     def violations(self) -> List[PolicyViolation]:
-        """Get all violations from crew and agents."""
-        all_violations = self._violations.copy()
-        for agent in self._governed_agents:
-            all_violations.extend(agent.violations)
-        return all_violations
+        """Get all violations from crew and agents.
+        
+        Note: Agent violations are already collected via the callback,
+        so we only return crew-level violations here. Agent violations
+        are forwarded to self._violations via _handle_violation.
+        """
+        return self._violations.copy()
 
     @property
     def audit_log(self) -> List[AuditEvent]:
@@ -419,7 +444,7 @@ def get_audit_summary(self) -> Dict[str, Any]:
             "total_violations": len(self.violations),
             "violations_by_type": self._count_by_type(),
             "total_events": len(self.audit_log),
-            "agents": [a.agent.role for a in self._governed_agents],
+            "agents": [getattr(a.agent, "role", "unknown") for a in self._governed_agents],
         }
 
     def _count_by_type(self) -> Dict[str, int]:

From 6bda520a6bcf67b68312ad98dd2c3b36c862e52e Mon Sep 17 00:00:00 2001
From: Imran Siddique <imran.siddique@microsoft.com>
Date: Thu, 5 Feb 2026 15:55:39 -0800
Subject: [PATCH 3/4] fix: Address all review comments

1. Rate limiting now enforced:
   - _tool_calls incremented when tools pass filter
   - _iterations incremented after each execution
   - TOOL_LIMIT_EXCEEDED and ITERATION_LIMIT_EXCEEDED violations raised

2. Content filter return type: Already fixed (returns sanitized string)

3. Timeout enforcement: Clarified in docstring that it's audit-only
   post-execution check. Real-time enforcement needs asyncio.timeout.

4. Audit event task_name: Fixed key mismatch - now extracts from
   both 'task_name' and 'task' object (via .description or .name)

5. Crew violations in audit log: _record_violation now calls
   _log_event to ensure all violations appear in audit trail
---
 src/crewai/governance/_kernel.py | 53 ++++++++++++++++++++++++++++++--
 1 file changed, 51 insertions(+), 2 deletions(-)

diff --git a/src/crewai/governance/_kernel.py b/src/crewai/governance/_kernel.py
index 2db4f04607..46f4b96005 100644
--- a/src/crewai/governance/_kernel.py
+++ b/src/crewai/governance/_kernel.py
@@ -25,6 +25,7 @@ class ViolationType(Enum):
 
     TOOL_BLOCKED = "tool_blocked"
     TOOL_LIMIT_EXCEEDED = "tool_limit_exceeded"
+    ITERATION_LIMIT_EXCEEDED = "iteration_limit_exceeded"
     MESSAGE_BLOCKED = "message_blocked"
     MESSAGE_LIMIT_EXCEEDED = "message_limit_exceeded"
     TIMEOUT = "timeout"
@@ -163,9 +164,27 @@ def governed_execute(task: Any, context: Optional[str] = None, tools: Optional[L
             if tools:
                 tools = self._filter_tools(tools)
 
+            # Check tool call limit before execution
+            if self.policy.max_tool_calls > 0 and self._tool_calls >= self.policy.max_tool_calls:
+                self._record_violation(
+                    ViolationType.TOOL_LIMIT_EXCEEDED,
+                    f"Tool calls ({self._tool_calls}) would exceed limit ({self.policy.max_tool_calls})",
+                )
+
             # Execute with governance
             try:
                 result = original_execute(task, context, tools)
+                
+                # Increment iteration counter
+                self._iterations += 1
+                
+                # Check iteration limit
+                if self.policy.max_iterations > 0 and self._iterations > self.policy.max_iterations:
+                    self._record_violation(
+                        ViolationType.ITERATION_LIMIT_EXCEEDED,
+                        f"Iterations ({self._iterations}) exceeded limit ({self.policy.max_iterations})",
+                    )
+                
                 # Check output for violations
                 result = self._check_output(result, task)
                 return result
@@ -202,6 +221,16 @@ def _filter_tools(self, tools: List[Any]) -> List[Any]:
                 continue
 
             filtered.append(tool)
+            
+            # Track tool call
+            self._tool_calls += 1
+            
+            # Check tool call limit
+            if self.policy.max_tool_calls > 0 and self._tool_calls > self.policy.max_tool_calls:
+                self._record_violation(
+                    ViolationType.TOOL_LIMIT_EXCEEDED,
+                    f"Tool calls ({self._tool_calls}) exceeded limit ({self.policy.max_tool_calls})",
+                )
 
         return filtered
 
@@ -276,11 +305,17 @@ def _log_event(self, event_type: str, **details: Any):
         if not self.policy.log_all_actions:
             return
 
+        # Extract task_name from either 'task_name' key or 'task' object
+        task_name = details.get("task_name")
+        if task_name is None and "task" in details:
+            task_obj = details["task"]
+            task_name = getattr(task_obj, "description", None) or getattr(task_obj, "name", None)
+
         event = AuditEvent(
             event_type=event_type,
             timestamp=datetime.now(timezone.utc),
             agent_name=getattr(self.agent, "role", "unknown"),
-            task_name=details.get("task_name"),
+            task_name=task_name,
             details=details,
         )
         self._audit_log.append(event)
@@ -365,6 +400,12 @@ def kickoff(self, inputs: Optional[Dict[str, Any]] = None) -> Any:
 
         Returns:
             Crew execution result.
+            
+        Note:
+            The max_execution_time check is performed after execution completes
+            and records a violation for audit purposes. For real-time timeout
+            enforcement, implement async execution with asyncio.timeout or
+            similar mechanisms at the application level.
         """
         self._log_event("crew_started", inputs=inputs)
         start_time = time.time()
@@ -372,7 +413,7 @@ def kickoff(self, inputs: Optional[Dict[str, Any]] = None) -> Any:
         try:
             result = self.crew.kickoff(inputs=inputs)
 
-            # Check execution time
+            # Check execution time (audit-only - records violation post-execution)
             elapsed = time.time() - start_time
             if elapsed > self.policy.max_execution_time:
                 self._record_violation(
@@ -406,6 +447,14 @@ def _record_violation(
         if self.on_violation:
             self.on_violation(violation)
 
+        # Log crew-level violations to audit trail
+        self._log_event(
+            "violation",
+            violation_type=violation_type.value,
+            description=description,
+            **details,
+        )
+
     def _log_event(self, event_type: str, **details: Any):
         """Log audit event."""
         if not self.policy.log_all_actions:

From 42793788a073c5ecefa99fa8329313ff56d62cd5 Mon Sep 17 00:00:00 2001
From: Imran Siddique <imran.siddique@microsoft.com>
Date: Fri, 6 Feb 2026 20:21:51 -0800
Subject: [PATCH 4/4] fix: Preserve original type for non-string outputs in
 content filter

The _check_output method was returning a string for non-string outputs
when violations were detected, which broke downstream consumers expecting
specific types (e.g., TaskOutput). Now returns the original object while
logging a warning. Violations are still recorded and can be retrieved
via get_violations().

Fixes review comment about return type breaking downstream consumers.
---
 src/crewai/governance/_kernel.py | 18 ++++++++++++++----
 1 file changed, 14 insertions(+), 4 deletions(-)

diff --git a/src/crewai/governance/_kernel.py b/src/crewai/governance/_kernel.py
index 46f4b96005..554c6cc93c 100644
--- a/src/crewai/governance/_kernel.py
+++ b/src/crewai/governance/_kernel.py
@@ -238,8 +238,9 @@ def _check_output(self, output: Any, task: Any) -> Any:
         """Check output for policy violations.
         
         Note: For non-string outputs, violations are detected and logged,
-        but the original object is returned. To fully sanitize complex
-        objects, serialize them first.
+        but the original object is returned to preserve type compatibility.
+        Violations can be retrieved via get_violations(). For string outputs,
+        blocked content is replaced with [BLOCKED] and length is truncated.
         """
         if output is None:
             return output
@@ -271,8 +272,17 @@ def _check_output(self, output: Any, task: Any) -> Any:
         if isinstance(output, str):
             return output_str
         elif was_modified:
-            # Non-string output with violations - return sanitized string representation
-            return output_str
+            # Non-string output with violations - log warning but return original object
+            # to avoid breaking downstream consumers that expect specific types.
+            # The violation has already been recorded; callers can check get_violations()
+            # if they need to know about content issues.
+            logger.warning(
+                "Content violation detected in non-string output (type: %s). "
+                "Returning original object to preserve type. Violations: %d",
+                type(output).__name__,
+                len(self._violations)
+            )
+            return output
         return output
 
     def _record_violation(