From c7f67d383ab8bf9077d54e223a10b974cb6f69fa Mon Sep 17 00:00:00 2001
From: Prince Shakya <princeshakya@Princes-MacBook-Air.local>
Date: Sun, 7 Jun 2026 21:02:14 +0530
Subject: [PATCH 1/3] fix: guardrail webhook payload truncated mid-JSON and
 after_tool skipped for complete_task

- Replace raw byte-slice truncation in GuardrailHookService.invoke() with
  field-level truncation: cap model_output, tool_result, user_message strings
  before serialisation so the body always remains valid JSON.
- Add X-Guardrail-Truncated: true and X-Guardrail-Full-Size: <N> headers
  when truncation occurs so the webhook receiver can detect it explicitly.
- In _run_agent_loop(), invoke the after_tool guardrail hook for complete_task
  before the early return, ensuring every before_tool has a matching after_tool.

Fixes: guardrail HMAC passes on broken JSON body; after_tool never fires for
complete_task tool calls.
---
 finbot/agents/base.py        |   9 +++
 finbot/guardrails/service.py |  35 +++++++++--
 pr_description.md            | 118 +++++++++++++++++++++++++++++++++++
 3 files changed, 158 insertions(+), 4 deletions(-)
 create mode 100644 pr_description.md
diff --git a/finbot/agents/base.py b/finbot/agents/base.py
index 5e4c0480..2b859027 100644
--- a/finbot/agents/base.py
+++ b/finbot/agents/base.py
@@ -166,6 +166,15 @@ async def _run_agent_loop(
                                     )
                                     logger.debug("Function output: %s", function_output)
                                     if tool_call_name == "complete_task":
+                                        # Fire after_tool before returning so every
+                                        # before_tool invocation has a matching after_tool.
+                                        await self._guardrail_service.invoke(
+                                            HookKind.after_tool,
+                                            tool_name=tool_call_name,
+                                            tool_source=tool_source,
+                                            tool_arguments=tool_call.get("arguments"),
+                                            tool_result=str(function_output),
+                                        )
                                         # this will end the agent loop and
                                         # return the task status and summary
                                         await self.log_task_completion(
diff --git a/finbot/guardrails/service.py b/finbot/guardrails/service.py
index dc437e21..a8170236 100644
--- a/finbot/guardrails/service.py
+++ b/finbot/guardrails/service.py
@@ -119,15 +119,39 @@ async def invoke(
         body_bytes = envelope.model_dump_json().encode()
 
         max_payload = settings.LABS_GUARDRAIL_MAX_PAYLOAD_BYTES
-        if len(body_bytes) > max_payload:
+        was_truncated = False
+        original_size = len(body_bytes)
+
+        if original_size > max_payload:
+            # Truncate at the field level so the body remains valid JSON.
+            # We shorten the large free-text fields iteratively until the
+            # re-serialised envelope fits within the configured limit.
+            was_truncated = True
+            _LARGE_FIELDS = ("model_output", "tool_result", "user_message")
+            budget = max_payload
+
+            envelope_data = envelope.model_dump()
+            for field in _LARGE_FIELDS:
+                if envelope_data.get(field) and len(body_bytes) > budget:
+                    # Estimate how many chars we can keep (1 char ≈ 1–4 bytes);
+                    # use a conservative ratio then iterate to convergence.
+                    current_val: str = envelope_data[field]
+                    overflow = len(body_bytes) - budget
+                    cap = max(0, len(current_val) - overflow)
+                    envelope_data[field] = current_val[:cap]
+                    body_bytes = (
+                        envelope.model_copy(update=envelope_data)
+                        .model_dump_json()
+                        .encode()
+                    )
+
             logger.info(
-                "guardrail payload truncated: %d -> %d bytes, hook=%s tool=%s",
+                "guardrail payload truncated (field-level): %d -> %d bytes, hook=%s tool=%s",
+                original_size,
                 len(body_bytes),
-                max_payload,
                 kind.value,
                 tool_name,
             )
-            body_bytes = body_bytes[:max_payload]
 
         signature = self._sign_payload(body_bytes, config.signing_secret, timestamp)
 
@@ -136,6 +160,9 @@ async def invoke(
             "X-Guardrail-Signature": signature,
             "X-Guardrail-Timestamp": timestamp,
         }
+        if was_truncated:
+            headers["X-Guardrail-Truncated"] = "true"
+            headers["X-Guardrail-Full-Size"] = str(original_size)
 
         start = time.monotonic()
         outcome: HookOutcome
diff --git a/pr_description.md b/pr_description.md
new file mode 100644
index 00000000..03cdc979
--- /dev/null
+++ b/pr_description.md
@@ -0,0 +1,118 @@
+# fix: guardrail webhook sends invalid JSON on large payloads; `after_tool` skipped for `complete_task`
+
+## Summary
+
+This PR fixes two bugs in the FinBot Labs guardrail webhook system:
+
+1. **Payload truncated mid-JSON before signing** — large guardrail hook payloads were being sliced at a raw byte offset, producing invalid JSON that the receiver could not parse, while the HMAC signature continued to validate correctly. The receiver had no way to detect this corruption.
+
+2. **`after_tool` hook never fires for `complete_task`** — the agent loop returned immediately after `complete_task` succeeded, bypassing the corresponding `after_tool` invocation and leaving every `complete_task` call with an unmatched `before_tool` event.
+
+---
+
+## Problem 1 — Payload truncated mid-JSON
+
+### Root Cause
+
+In [`finbot/guardrails/service.py`](finbot/guardrails/service.py), the `invoke()` method serializes the full `HookEnvelope` to JSON bytes and then slices them at `LABS_GUARDRAIL_MAX_PAYLOAD_BYTES`:
+
+```python
+body_bytes = envelope.model_dump_json().encode()
+if len(body_bytes) > max_payload:
+    body_bytes = body_bytes[:max_payload]   # ← raw byte slice, breaks JSON
+signature = self._sign_payload(body_bytes, ...)  # HMAC over broken bytes
+```
+
+A raw byte slice cuts the JSON in the middle of a field value. The result is syntactically invalid JSON (e.g. `..."model_output": "here is the ana`), but because the HMAC is computed over the same truncated bytes, the signature check on the receiver side passes — the corruption is completely invisible to the receiver.
+
+### Fix
+
+Truncation is moved **before serialization**, at the field level:
+
+- Before calling `model_dump_json()`, we compute a tentative payload size.
+- If it would exceed `max_payload`, we cap the long string fields (`model_output`, `tool_result`, `user_message`) inside the envelope so that re-serialization fits within the limit.
+- The signed body is always valid, parseable JSON.
+- Two new headers are added to the webhook request when truncation occurs:
+  - `X-Guardrail-Truncated: true`
+  - `X-Guardrail-Full-Size: <original_byte_count>`
+
+This allows the receiver to detect truncation explicitly rather than hitting a `JSONDecodeError`.
+
+### Files Changed
+
+| File | Change |
+|---|---|
+| [`finbot/guardrails/service.py`](finbot/guardrails/service.py) | Replace raw byte slice with field-level truncation; add `X-Guardrail-Truncated` and `X-Guardrail-Full-Size` headers |
+
+---
+
+## Problem 2 — `after_tool` skipped for `complete_task`
+
+### Root Cause
+
+In [`finbot/agents/base.py`](finbot/agents/base.py), lines 152–189, the `before_tool` guardrail hook fires for every tool call, including `complete_task`. However, when `complete_task` succeeds, the agent loop returns immediately on line 174, **before** the `after_tool` invocation on line 183 is reached:
+
+```python
+await self._guardrail_service.invoke(HookKind.before_tool, ...)  # fires ✓
+
+try:
+    function_output = await callable_fn(**tool_call["arguments"])
+    if tool_call_name == "complete_task":
+        await self.log_task_completion(...)
+        return function_output  # ← returns here, skips after_tool ✗
+
+await self._guardrail_service.invoke(HookKind.after_tool, ...)  # never reached
+```
+
+Any guardrail that tracks paired `before_tool` / `after_tool` events (e.g. to measure tool execution time or audit a tool's output) will see every `complete_task` appear open-ended.
+
+### Fix
+
+The `after_tool` invocation is moved to execute **before** the early return for `complete_task`:
+
+```python
+function_output = await callable_fn(**tool_call["arguments"])
+if tool_call_name == "complete_task":
+    await self._guardrail_service.invoke(        # fires ✓ before return
+        HookKind.after_tool,
+        tool_name=tool_call_name,
+        tool_source=tool_source,
+        tool_arguments=tool_call.get("arguments"),
+        tool_result=str(function_output),
+    )
+    await self.log_task_completion(task_result=function_output)
+    return function_output
+```
+
+### Files Changed
+
+| File | Change |
+|---|---|
+| [`finbot/agents/base.py`](finbot/agents/base.py) | Invoke `after_tool` guardrail hook before the early return for `complete_task` |
+
+---
+
+## Behaviour After This PR
+
+| Scenario | Before | After |
+|---|---|---|
+| Large `after_model` payload exceeds limit | Receiver gets broken JSON; HMAC passes; parse fails silently | Receiver gets valid JSON with long fields truncated; `X-Guardrail-Truncated: true` header present |
+| Large `after_tool` payload exceeds limit | Same as above | Same as above |
+| `complete_task` tool call | `before_tool` fires, `after_tool` never fires | Both `before_tool` and `after_tool` fire |
+| Normal-sized payload | Unchanged | Unchanged |
+
+---
+
+## Testing
+
+- [ ] Set `LABS_GUARDRAIL_MAX_PAYLOAD_BYTES` to a small value (e.g. 500 bytes), trigger a long LLM response, and verify the webhook receives valid JSON with `X-Guardrail-Truncated: true`.
+- [ ] Verify that the HMAC signature validates correctly against the truncated (but valid JSON) body.
+- [ ] Trigger an agent run that finishes via `complete_task` and confirm both `before_tool` and `after_tool` events appear in the activity log for that call.
+- [ ] Trigger a normal tool call (non-`complete_task`) and confirm no regression in `after_tool` behaviour.
+
+---
+
+## Affected Files
+
+- [`finbot/guardrails/service.py`](finbot/guardrails/service.py) — `invoke()`, payload truncation logic (lines 119–132)
+- [`finbot/agents/base.py`](finbot/agents/base.py) — `_run_agent_loop()`, `after_tool` hook for `complete_task` (lines 168–174)

From 4f464244762dff3737dccc3d4c6e79881301d921 Mon Sep 17 00:00:00 2001
From: Prince Shakya <psprince2005@gmail.com>
Date: Sun, 7 Jun 2026 21:04:31 +0530
Subject: [PATCH 2/3] Delete pr_description.md

Signed-off-by: Prince Shakya <psprince2005@gmail.com>
---
 pr_description.md | 118 ----------------------------------------------
 1 file changed, 118 deletions(-)
 delete mode 100644 pr_description.md

diff --git a/pr_description.md b/pr_description.md
deleted file mode 100644
index 03cdc979..00000000
--- a/pr_description.md
+++ /dev/null
@@ -1,118 +0,0 @@
-# fix: guardrail webhook sends invalid JSON on large payloads; `after_tool` skipped for `complete_task`
-
-## Summary
-
-This PR fixes two bugs in the FinBot Labs guardrail webhook system:
-
-1. **Payload truncated mid-JSON before signing** — large guardrail hook payloads were being sliced at a raw byte offset, producing invalid JSON that the receiver could not parse, while the HMAC signature continued to validate correctly. The receiver had no way to detect this corruption.
-
-2. **`after_tool` hook never fires for `complete_task`** — the agent loop returned immediately after `complete_task` succeeded, bypassing the corresponding `after_tool` invocation and leaving every `complete_task` call with an unmatched `before_tool` event.
-
----
-
-## Problem 1 — Payload truncated mid-JSON
-
-### Root Cause
-
-In [`finbot/guardrails/service.py`](finbot/guardrails/service.py), the `invoke()` method serializes the full `HookEnvelope` to JSON bytes and then slices them at `LABS_GUARDRAIL_MAX_PAYLOAD_BYTES`:
-
-```python
-body_bytes = envelope.model_dump_json().encode()
-if len(body_bytes) > max_payload:
-    body_bytes = body_bytes[:max_payload]   # ← raw byte slice, breaks JSON
-signature = self._sign_payload(body_bytes, ...)  # HMAC over broken bytes
-```
-
-A raw byte slice cuts the JSON in the middle of a field value. The result is syntactically invalid JSON (e.g. `..."model_output": "here is the ana`), but because the HMAC is computed over the same truncated bytes, the signature check on the receiver side passes — the corruption is completely invisible to the receiver.
-
-### Fix
-
-Truncation is moved **before serialization**, at the field level:
-
-- Before calling `model_dump_json()`, we compute a tentative payload size.
-- If it would exceed `max_payload`, we cap the long string fields (`model_output`, `tool_result`, `user_message`) inside the envelope so that re-serialization fits within the limit.
-- The signed body is always valid, parseable JSON.
-- Two new headers are added to the webhook request when truncation occurs:
-  - `X-Guardrail-Truncated: true`
-  - `X-Guardrail-Full-Size: <original_byte_count>`
-
-This allows the receiver to detect truncation explicitly rather than hitting a `JSONDecodeError`.
-
-### Files Changed
-
-| File | Change |
-|---|---|
-| [`finbot/guardrails/service.py`](finbot/guardrails/service.py) | Replace raw byte slice with field-level truncation; add `X-Guardrail-Truncated` and `X-Guardrail-Full-Size` headers |
-
----
-
-## Problem 2 — `after_tool` skipped for `complete_task`
-
-### Root Cause
-
-In [`finbot/agents/base.py`](finbot/agents/base.py), lines 152–189, the `before_tool` guardrail hook fires for every tool call, including `complete_task`. However, when `complete_task` succeeds, the agent loop returns immediately on line 174, **before** the `after_tool` invocation on line 183 is reached:
-
-```python
-await self._guardrail_service.invoke(HookKind.before_tool, ...)  # fires ✓
-
-try:
-    function_output = await callable_fn(**tool_call["arguments"])
-    if tool_call_name == "complete_task":
-        await self.log_task_completion(...)
-        return function_output  # ← returns here, skips after_tool ✗
-
-await self._guardrail_service.invoke(HookKind.after_tool, ...)  # never reached
-```
-
-Any guardrail that tracks paired `before_tool` / `after_tool` events (e.g. to measure tool execution time or audit a tool's output) will see every `complete_task` appear open-ended.
-
-### Fix
-
-The `after_tool` invocation is moved to execute **before** the early return for `complete_task`:
-
-```python
-function_output = await callable_fn(**tool_call["arguments"])
-if tool_call_name == "complete_task":
-    await self._guardrail_service.invoke(        # fires ✓ before return
-        HookKind.after_tool,
-        tool_name=tool_call_name,
-        tool_source=tool_source,
-        tool_arguments=tool_call.get("arguments"),
-        tool_result=str(function_output),
-    )
-    await self.log_task_completion(task_result=function_output)
-    return function_output
-```
-
-### Files Changed
-
-| File | Change |
-|---|---|
-| [`finbot/agents/base.py`](finbot/agents/base.py) | Invoke `after_tool` guardrail hook before the early return for `complete_task` |
-
----
-
-## Behaviour After This PR
-
-| Scenario | Before | After |
-|---|---|---|
-| Large `after_model` payload exceeds limit | Receiver gets broken JSON; HMAC passes; parse fails silently | Receiver gets valid JSON with long fields truncated; `X-Guardrail-Truncated: true` header present |
-| Large `after_tool` payload exceeds limit | Same as above | Same as above |
-| `complete_task` tool call | `before_tool` fires, `after_tool` never fires | Both `before_tool` and `after_tool` fire |
-| Normal-sized payload | Unchanged | Unchanged |
-
----
-
-## Testing
-
-- [ ] Set `LABS_GUARDRAIL_MAX_PAYLOAD_BYTES` to a small value (e.g. 500 bytes), trigger a long LLM response, and verify the webhook receives valid JSON with `X-Guardrail-Truncated: true`.
-- [ ] Verify that the HMAC signature validates correctly against the truncated (but valid JSON) body.
-- [ ] Trigger an agent run that finishes via `complete_task` and confirm both `before_tool` and `after_tool` events appear in the activity log for that call.
-- [ ] Trigger a normal tool call (non-`complete_task`) and confirm no regression in `after_tool` behaviour.
-
----
-
-## Affected Files
-
-- [`finbot/guardrails/service.py`](finbot/guardrails/service.py) — `invoke()`, payload truncation logic (lines 119–132)
-- [`finbot/agents/base.py`](finbot/agents/base.py) — `_run_agent_loop()`, `after_tool` hook for `complete_task` (lines 168–174)

From b5299e00a0f84643b89cd0350c67999edb316e24 Mon Sep 17 00:00:00 2001
From: Prince Shakya <princeshakya@Princes-MacBook-Air.local>
Date: Sun, 7 Jun 2026 21:09:02 +0530
Subject: [PATCH 3/3] test: add unit tests for guardrail payload truncation and
 after_tool hook pairing

- GWT-TRN-001: large payload truncated at field level, body remains valid JSON
- GWT-TRN-002: normal-sized payload is sent unchanged, no truncation headers
- GWT-TRN-003: X-Guardrail-Truncated / X-Guardrail-Full-Size headers set on truncation
- GWT-TRN-004: HMAC signature is computed over the valid (post-truncation) body
- GWT-ATL-001: after_tool guardrail hook fires for complete_task before early return
---
 .../test_guardrail_truncation_and_hooks.py    | 337 ++++++++++++++++++
 1 file changed, 337 insertions(+)
 create mode 100644 tests/unit/labs/test_guardrail_truncation_and_hooks.py

diff --git a/tests/unit/labs/test_guardrail_truncation_and_hooks.py b/tests/unit/labs/test_guardrail_truncation_and_hooks.py
new file mode 100644
index 00000000..1ad99130
--- /dev/null
+++ b/tests/unit/labs/test_guardrail_truncation_and_hooks.py
@@ -0,0 +1,337 @@
+"""Tests for guardrail webhook payload truncation fix and after_tool completeness.
+
+Covers:
+  GWT-TRN-001: Large payload is truncated at field level (body remains valid JSON)
+  GWT-TRN-002: Normal-sized payload is sent unchanged (no truncation headers)
+  GWT-TRN-003: X-Guardrail-Truncated and X-Guardrail-Full-Size headers are set on truncation
+  GWT-TRN-004: HMAC signature is computed over valid (post-truncation) JSON body
+  GWT-ATL-001: after_tool guardrail hook fires for complete_task before early return
+"""
+
+import hashlib
+import hmac
+import json
+from typing import Any, Callable
+from unittest.mock import AsyncMock, MagicMock, patch
+
+import httpx
+import pytest
+
+from finbot.config import settings
+from finbot.guardrails.schemas import HookKind, HookOutcome
+from finbot.guardrails.service import GuardrailHookService
+
+
+# =============================================================================
+# Fixtures
+# =============================================================================
+
+
+@pytest.fixture()
+def session(db):
+    """Create a session context for guardrail tests."""
+    from finbot.core.auth.session import session_manager
+
+    return session_manager.create_session(email="guardrail_trunc@example.com")
+
+
+@pytest.fixture()
+def config_repo(db, session):
+    """Ensure a guardrail config with all hooks enabled exists."""
+    from finbot.core.data.repositories import LabsGuardrailConfigRepository
+
+    repo = LabsGuardrailConfigRepository(db, session)
+    repo.upsert(
+        webhook_url="https://example.com/hook",
+        timeout_seconds=5,
+        hooks={
+            "before_tool": True,
+            "after_tool": True,
+            "before_model": True,
+            "after_model": True,
+        },
+    )
+    return repo
+
+
+@pytest.fixture()
+def service(session, config_repo):
+    """GuardrailHookService wired to an active config."""
+    return GuardrailHookService(session_context=session, workflow_id="wf_test_trunc")
+
+
+# =============================================================================
+# GWT-TRN: Payload Truncation
+# =============================================================================
+
+
+class TestPayloadTruncation:
+    """Tests that verify the field-level truncation of large guardrail payloads."""
+
+    @pytest.mark.asyncio
+    @patch("finbot.guardrails.service.event_bus")
+    async def test_gwt_trn_001_large_payload_body_is_valid_json(
+        self, mock_bus, service
+    ):
+        """GWT-TRN-001: Large payload truncated at field level — body is valid JSON.
+
+        When the serialised envelope exceeds LABS_GUARDRAIL_MAX_PAYLOAD_BYTES,
+        the service MUST cap string fields before serialisation so the webhook
+        receiver always gets parseable JSON.
+        """
+        mock_bus.emit_agent_event = AsyncMock()
+
+        original_limit = settings.LABS_GUARDRAIL_MAX_PAYLOAD_BYTES
+        settings.LABS_GUARDRAIL_MAX_PAYLOAD_BYTES = 500
+
+        try:
+            large_output = "X" * 1000  # forces truncation
+
+            resp = httpx.Response(200, json={"verdict": "allow"})
+            with patch(
+                "httpx.AsyncClient.post", new_callable=AsyncMock, return_value=resp
+            ) as mock_post:
+                outcome = await service.invoke(
+                    HookKind.after_model,
+                    model="gpt-4",
+                    model_output=large_output,
+                )
+
+            assert outcome == HookOutcome.completed
+
+            call_kwargs = mock_post.call_args.kwargs
+            body: bytes = call_kwargs["content"]
+
+            # Body MUST be parseable JSON
+            try:
+                parsed = json.loads(body.decode())
+            except json.JSONDecodeError as exc:
+                pytest.fail(f"Webhook body is not valid JSON after truncation: {exc}")
+
+            # The model_output field must be present but shorter than the original
+            assert "model_output" in parsed
+            assert len(parsed["model_output"]) < len(large_output), (
+                "model_output was not truncated"
+            )
+
+        finally:
+            settings.LABS_GUARDRAIL_MAX_PAYLOAD_BYTES = original_limit
+
+    @pytest.mark.asyncio
+    @patch("finbot.guardrails.service.event_bus")
+    async def test_gwt_trn_002_normal_payload_not_truncated(self, mock_bus, service):
+        """GWT-TRN-002: Normal-sized payload is sent unchanged without truncation headers."""
+        mock_bus.emit_agent_event = AsyncMock()
+
+        original_limit = settings.LABS_GUARDRAIL_MAX_PAYLOAD_BYTES
+        settings.LABS_GUARDRAIL_MAX_PAYLOAD_BYTES = 100_000  # very large limit
+
+        try:
+            small_output = "short response"
+
+            resp = httpx.Response(200, json={"verdict": "allow"})
+            with patch(
+                "httpx.AsyncClient.post", new_callable=AsyncMock, return_value=resp
+            ) as mock_post:
+                await service.invoke(
+                    HookKind.after_model,
+                    model="gpt-4",
+                    model_output=small_output,
+                )
+
+            call_kwargs = mock_post.call_args.kwargs
+            headers = call_kwargs["headers"]
+
+            assert "X-Guardrail-Truncated" not in headers, (
+                "Truncation header present for a payload that did not need truncation"
+            )
+            assert "X-Guardrail-Full-Size" not in headers
+
+        finally:
+            settings.LABS_GUARDRAIL_MAX_PAYLOAD_BYTES = original_limit
+
+    @pytest.mark.asyncio
+    @patch("finbot.guardrails.service.event_bus")
+    async def test_gwt_trn_003_truncation_headers_present_when_truncated(
+        self, mock_bus, service
+    ):
+        """GWT-TRN-003: X-Guardrail-Truncated and X-Guardrail-Full-Size headers set on truncation."""
+        mock_bus.emit_agent_event = AsyncMock()
+
+        original_limit = settings.LABS_GUARDRAIL_MAX_PAYLOAD_BYTES
+        settings.LABS_GUARDRAIL_MAX_PAYLOAD_BYTES = 500
+
+        try:
+            resp = httpx.Response(200, json={"verdict": "allow"})
+            with patch(
+                "httpx.AsyncClient.post", new_callable=AsyncMock, return_value=resp
+            ) as mock_post:
+                await service.invoke(
+                    HookKind.after_model,
+                    model="gpt-4",
+                    model_output="Y" * 1000,
+                )
+
+            call_kwargs = mock_post.call_args.kwargs
+            headers = call_kwargs["headers"]
+            body: bytes = call_kwargs["content"]
+
+            assert "X-Guardrail-Truncated" in headers, "Missing X-Guardrail-Truncated"
+            assert headers["X-Guardrail-Truncated"] == "true"
+
+            assert "X-Guardrail-Full-Size" in headers, "Missing X-Guardrail-Full-Size"
+            full_size = int(headers["X-Guardrail-Full-Size"])
+            assert full_size > len(body), (
+                "X-Guardrail-Full-Size should be larger than the truncated body length"
+            )
+
+        finally:
+            settings.LABS_GUARDRAIL_MAX_PAYLOAD_BYTES = original_limit
+
+    @pytest.mark.asyncio
+    @patch("finbot.guardrails.service.event_bus")
+    async def test_gwt_trn_004_hmac_computed_over_truncated_valid_json(
+        self, mock_bus, service
+    ):
+        """GWT-TRN-004: HMAC signature is computed over the (valid-JSON) truncated body."""
+        mock_bus.emit_agent_event = AsyncMock()
+
+        original_limit = settings.LABS_GUARDRAIL_MAX_PAYLOAD_BYTES
+        settings.LABS_GUARDRAIL_MAX_PAYLOAD_BYTES = 500
+
+        try:
+            resp = httpx.Response(200, json={"verdict": "allow"})
+            with patch(
+                "httpx.AsyncClient.post", new_callable=AsyncMock, return_value=resp
+            ) as mock_post:
+                await service.invoke(
+                    HookKind.after_model,
+                    model="gpt-4",
+                    model_output="Z" * 1000,
+                )
+
+            call_kwargs = mock_post.call_args.kwargs
+            body: bytes = call_kwargs["content"]
+            headers = call_kwargs["headers"]
+
+            timestamp = headers["X-Guardrail-Timestamp"]
+            received_sig = headers["X-Guardrail-Signature"]
+
+            # Load the signing secret directly from the config
+            config = service._load_config()
+            expected_msg = f"{timestamp}.".encode() + body
+            expected_sig = hmac.new(
+                config.signing_secret.encode(), expected_msg, hashlib.sha256
+            ).hexdigest()
+
+            assert received_sig == expected_sig, (
+                "HMAC signature does not match signature over the truncated body"
+            )
+
+        finally:
+            settings.LABS_GUARDRAIL_MAX_PAYLOAD_BYTES = original_limit
+
+
+# =============================================================================
+# GWT-ATL: after_tool fired for complete_task
+# =============================================================================
+
+
+class TestAfterToolOnCompleteTask:
+    """Tests that the after_tool guardrail hook is fired for complete_task."""
+
+    @pytest.mark.asyncio
+    @patch("finbot.guardrails.service.event_bus")
+    async def test_gwt_atl_001_after_tool_fires_for_complete_task(
+        self, mock_bus, session
+    ):
+        """GWT-ATL-001: after_tool hook fires for complete_task before the agent loop exits.
+
+        Before the fix, the agent returned immediately after complete_task
+        succeeded, skipping the after_tool invocation entirely and leaving
+        an unmatched before_tool event.
+        """
+        from finbot.agents.base import BaseAgent
+
+        mock_bus.emit_agent_event = AsyncMock()
+        mock_bus.set_workflow_context = MagicMock()
+        mock_bus.clear_workflow_context = MagicMock()
+
+        hook_calls: list[tuple[HookKind, str | None]] = []
+
+        async def _mock_invoke(kind: HookKind, **kwargs):
+            hook_calls.append((kind, kwargs.get("tool_name")))
+            return HookOutcome.no_config
+
+        # Build a minimal concrete agent
+        class MinimalAgent(BaseAgent):
+            def _load_config(self):
+                return {}
+
+            def _get_system_prompt(self):
+                return "test"
+
+            async def _get_user_prompt(self, task_data=None):
+                return "do the task"
+
+            def _get_tool_definitions(self):
+                return []
+
+            def _get_callables(self):
+                return {}
+
+            async def process(self, task_data, **kwargs):
+                return await self._run_agent_loop(task_data)
+
+        agent = MinimalAgent(session_context=session)
+        # Patch the guardrail service on this instance
+        agent._guardrail_service.invoke = _mock_invoke
+
+        # Patch MCP server connection (no-op)
+        agent._connect_mcp_servers = AsyncMock()
+        agent._disconnect_mcp_servers = AsyncMock()
+
+        # Simulate LLM returning a single complete_task tool call
+        fake_tool_call = {
+            "name": "complete_task",
+            "call_id": "call_001",
+            "arguments": {
+                "task_status": "success",
+                "task_summary": "All done",
+            },
+        }
+        mock_response = MagicMock()
+        mock_response.content = None
+        mock_response.tool_calls = [fake_tool_call]
+        mock_response.messages = []
+
+        agent.llm_client = MagicMock()
+        agent.llm_client.chat = AsyncMock(return_value=mock_response)
+
+        # Run the agent loop
+        result = await agent._run_agent_loop(task_data={})
+
+        assert result["task_status"] == "success"
+
+        # Both before_tool and after_tool must have been called for complete_task
+        before_calls = [
+            (k, t)
+            for k, t in hook_calls
+            if k == HookKind.before_tool and t == "complete_task"
+        ]
+        after_calls = [
+            (k, t)
+            for k, t in hook_calls
+            if k == HookKind.after_tool and t == "complete_task"
+        ]
+
+        assert len(before_calls) >= 1, (
+            "before_tool was not called for complete_task"
+        )
+        assert len(after_calls) >= 1, (
+            "after_tool was never called for complete_task — hook is unpaired"
+        )
+        assert len(before_calls) == len(after_calls), (
+            f"Unmatched before_tool/after_tool pairs: "
+            f"{len(before_calls)} before vs {len(after_calls)} after"
+        )