🐛 fix(Traces): Add proper tracing

AI4I-IT · AI4I-IT · commit 5ce94b906eb4 · 2026-01-19T19:09:41.000Z
diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
@@ -36,6 +36,8 @@ jobs:
   python-checks:
     name: Linting and Formatting
     runs-on: ubuntu-latest
+    # Skip on main push since PR already validated
+    if: github.event_name == 'pull_request'
     steps:
       - uses: actions/checkout@v6
 
@@ -58,9 +60,11 @@ jobs:
       - name: Run Ruff Formatting Check
         run: uv run ruff format --check .
 
-  test:
+  # Full compatibility matrix - only on PRs to main
+  test-matrix:
     name: Tests (Python ${{ matrix.python-version }}, ${{ matrix.os }})
     runs-on: ${{ matrix.os }}
+    if: github.event_name == 'pull_request' && github.base_ref == 'main'
     strategy:
       fail-fast: false
       matrix:
@@ -87,6 +91,37 @@ jobs:
 
       - name: Upload coverage to Codecov
         if: matrix.os == 'ubuntu-latest' && matrix.python-version == '3.11'
+        uses: codecov/codecov-action@v5
+        with:
+          token: ${{ secrets.CODECOV_TOKEN }}
+          files: reports/coverage.xml
+          fail_ci_if_error: true
+
+  # Quick test - for PRs to non-main branches
+  test-quick:
+    name: Tests (Quick)
+    runs-on: ubuntu-latest
+    if: github.event_name == 'pull_request' && github.base_ref != 'main'
+    steps:
+      - uses: actions/checkout@v6
+
+      - name: Install uv
+        uses: astral-sh/setup-uv@v7
+        with:
+          enable-cache: true
+
+      - name: Set up Python
+        uses: actions/setup-python@v6
+        with:
+          python-version: '3.11'
+
+      - name: Install dependencies
+        run: uv sync --group dev
+
+      - name: Run tests with coverage
+        run: uv run pytest --cov --cov-report=xml:reports/coverage.xml -m "not google_adk"
+
+      - name: Upload coverage to Codecov
         uses: codecov/codecov-action@v5
         with:
           token: ${{ secrets.CODECOV_TOKEN }}
diff --git a/hackagent/attacks/techniques/base.py b/hackagent/attacks/techniques/base.py
@@ -105,8 +105,9 @@ def __init__(
         # This allows subclass to merge with its own defaults first
         self.config = config
 
-        # Run setup
-        self.run_id = self.config.get("run_id")
+        # Run setup - check both "run_id" and "_run_id" for backwards compatibility
+        # The orchestrator passes "_run_id" while direct usage may use "run_id"
+        self.run_id = self.config.get("_run_id") or self.config.get("run_id")
         self.run_dir = self.config.get("output_dir", "./logs/runs")
 
         # Tracking
diff --git a/hackagent/router/router.py b/hackagent/router/router.py
@@ -1082,9 +1082,170 @@ def route_with_tracking(
                     f"⚠️ Result creation failed: status={result_response.status_code}"
                 )
 
+            # Create traces for this result if we have a result_id
+            if result_id:
+                self._create_traces_for_result(
+                    result_id=result_id,
+                    client=client,
+                    request_data=request_data,
+                    response=response,
+                )
+
         except Exception as e:
             logger.error(f"❌ Failed to create Result record: {e}", exc_info=True)
             result_id = None
 
         # Return both response and result_id for tracking
         return {"response": response, "result_id": result_id}
+
+    def _create_traces_for_result(
+        self,
+        result_id: str,
+        client,
+        request_data: Dict[str, Any],
+        response: Any,
+    ) -> None:
+        """
+        Create trace records for a result capturing the agent execution details.
+
+        Traces are posted in order with increasing ``sequence`` numbers: one
+        for the request, one per tool call found on ``response`` (attribute or
+        dict key ``tool_calls``), and one for the agent response text.
+
+        Tracing is best-effort: any exception is logged as a warning and
+        swallowed, and traces posted before the failure are left in place.
+
+        Args:
+            result_id: The UUID of the result to attach traces to
+            client: Authenticated client for API calls
+            request_data: The original request data sent to the agent
+            response: The response from the agent
+        """
+        from ..api.result import result_trace_create
+        from ..models import TraceRequest, StepTypeEnum
+
+        sequence = 0
+
+        def post_trace(step_type, content: Dict[str, Any]) -> None:
+            # Single place that numbers and sends a trace, so every trace
+            # gets the next sequence value in posting order.
+            nonlocal sequence
+            sequence += 1
+            trace = TraceRequest(
+                sequence=sequence,
+                step_type=step_type,
+                content=content,
+            )
+            result_trace_create.sync_detailed(
+                id=result_uuid,
+                client=client,
+                body=trace,
+            )
+
+        try:
+            result_uuid = UUID(result_id)
+
+            # Trace 1: Capture the user input/request
+            post_trace(
+                StepTypeEnum.OTHER,
+                {
+                    "step_name": "User Request",
+                    "messages": request_data.get("messages", []),
+                    "prompt": request_data.get("prompt", ""),
+                },
+            )
+            logger.debug(f"Created input trace for result {result_id}")
+
+            # Trace 2: Capture tool calls if present. Attribute access is
+            # tried first; dict responses are checked only as a fallback.
+            tool_calls = getattr(response, "tool_calls", None)
+            if not tool_calls and isinstance(response, dict):
+                tool_calls = response.get("tool_calls")
+            if tool_calls:
+                for tool_call in tool_calls:
+                    post_trace(
+                        StepTypeEnum.TOOL_CALL,
+                        self._trace_tool_call_content(tool_call),
+                    )
+                logger.debug(f"Created {len(tool_calls)} tool call traces")
+
+            # Trace 3: Capture the agent response
+            response_content = self._trace_response_content(response)
+            post_trace(
+                StepTypeEnum.AGENT_RESPONSE_CHUNK,
+                {
+                    "step_name": "Agent Response",
+                    "response": response_content[:5000]
+                    if response_content
+                    else "",  # Truncate large responses
+                    "finish_reason": self._extract_finish_reason(response),
+                },
+            )
+            logger.info(f"✅ Created {sequence} traces for result {result_id}")
+
+        except Exception as e:
+            logger.warning(f"Failed to create traces for result {result_id}: {e}")
+
+    @staticmethod
+    def _trace_tool_call_content(tool_call: Any) -> Dict[str, Any]:
+        """Build the trace content for one tool call given as a dict or an object."""
+        if isinstance(tool_call, dict):
+            # `or {}` covers a "function" key that is present but None.
+            function = tool_call.get("function") or {}
+            tool_name = function.get("name", "unknown")
+            arguments = function.get("arguments", "")
+            tool_id = tool_call.get("id", "")
+        else:
+            function = getattr(tool_call, "function", None)
+            tool_name = getattr(function, "name", "unknown")
+            arguments = getattr(function, "arguments", "")
+            tool_id = getattr(tool_call, "id", "")
+        return {
+            "step_name": "Tool Call",
+            "tool_name": tool_name,
+            "tool_id": tool_id,
+            "arguments": arguments,
+        }
+
+    @staticmethod
+    def _trace_response_content(response: Any) -> Any:
+        """Pull the response text out of an object- or dict-shaped response."""
+        if hasattr(response, "choices") and response.choices:
+            choice = response.choices[0]
+            if hasattr(choice, "message") and choice.message:
+                return getattr(choice.message, "content", "") or ""
+            return ""
+        if isinstance(response, dict):
+            if response.get("choices"):
+                # `or {}` covers a "message" key that is present but None,
+                # which would otherwise raise and drop the response trace.
+                message = response["choices"][0].get("message") or {}
+                return message.get("content", "")
+            if "generated_text" in response:
+                return response["generated_text"]
+            if "content" in response:
+                return response["content"]
+        return ""
+
+    def _extract_finish_reason(self, response: Any) -> str:
+        """
+        Extract finish_reason from the first choice of a response.
+
+        Args:
+            response: Either an object exposing ``choices`` or a dict with a
+                "choices" key; anything else yields "unknown"
+
+        Returns:
+            The first choice's finish_reason, or "unknown" when it is missing,
+            None, or empty
+        """
+        if hasattr(response, "choices") and response.choices:
+            choice = response.choices[0]
+            if hasattr(choice, "finish_reason"):
+                return choice.finish_reason or "unknown"
+        elif isinstance(response, dict) and "choices" in response:
+            choices = response.get("choices", [])
+            if choices:
+                # Use `or` rather than a .get() default: the key may be present
+                # with a None value, and this method must always return a string.
+                return choices[0].get("finish_reason") or "unknown"
+        return "unknown"
diff --git a/hackagent/router/tracking/tracker.py b/hackagent/router/tracking/tracker.py
@@ -255,19 +255,39 @@ def _sanitize_config(self, config: Dict[str, Any]) -> Dict[str, Any]:
             Sanitized configuration dictionary
         """
         sensitive_keys = {"api_key", "token", "secret", "password", "key"}
+        # Keys that contain non-serializable objects (like client instances)
+        skip_keys = {"_client", "client"}
 
         sanitized = {}
         for key, value in config.items():
+            # Skip non-serializable objects
+            if key in skip_keys:
+                sanitized[key] = f"<{type(value).__name__}>"
+                continue
+
             key_lower = key.lower()
             if any(sensitive in key_lower for sensitive in sensitive_keys):
                 sanitized[key] = "***REDACTED***"
             elif isinstance(value, dict):
                 sanitized[key] = self._sanitize_config(value)
+            elif not self._is_json_serializable(value):
+                # Skip non-JSON-serializable values
+                sanitized[key] = f"<{type(value).__name__}>"
             else:
                 sanitized[key] = value
 
         return sanitized
 
+    def _is_json_serializable(self, value: Any) -> bool:
+        """
+        Report whether ``value`` can be encoded with ``json.dumps``.
+
+        Args:
+            value: Any object to probe
+
+        Returns:
+            True if encoding succeeds, False if it raises TypeError or ValueError
+        """
+        from json import dumps
+
+        serializable = True
+        try:
+            # The encoded output is discarded; only success or failure matters.
+            dumps(value)
+        except (TypeError, ValueError):
+            serializable = False
+        return serializable
+
     def _handle_step_error(self, step_name: str, error_message: str) -> None:
         """
         Update backend with step error information.