ory · aeneasr · Mar 3, 2026 · Mar 2, 2026 · Mar 2, 2026 · Mar 2, 2026
diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
@@ -72,5 +72,5 @@ jobs:
         run: make e2e
         env:
           OLLAMA_HOST: http://localhost:11434
-          AGENT_INDEX_EMBED_MODEL: all-minilm
-          AGENT_INDEX_EMBED_DIMS: '384'
+          LUMEN_EMBED_MODEL: all-minilm
+          LUMEN_EMBED_DIMS: '384'
diff --git a/.gitignore b/.gitignore
@@ -1,11 +1,10 @@
 # Binary
-agent-index
-agent-index
+lumen
 
 # IDE
 .idea/
 .vscode/
 *.swp
 
 # OS
-.DS_Store
+.DS_Store
diff --git a/.golangci.yml b/.golangci.yml
@@ -4,4 +4,4 @@ run:
   timeout: 5m
 
 linters:
-  default: all
+  default: standard
diff --git a/CLAUDE.md b/CLAUDE.md
diff --git a/Makefile b/Makefile
@@ -1,4 +1,4 @@
-BINARY   := agent-index
+BINARY   := lumen
 GO       := go
 GOTAGS   := fts5
 GOFLAGS  := -tags=$(GOTAGS)
@@ -15,7 +15,7 @@ install:
 	CGO_ENABLED=1 $(GO) install $(GOFLAGS) ./...
 
 e2e:
-	CGO_ENABLED=1 $(GO) test -tags=$(GOTAGS),e2e -timeout=5m -v -count=1 ./...
+	CGO_ENABLED=1 $(GO) test -tags=$(GOTAGS),e2e -timeout=20m -v -count=1 ./...
 
 lint:
 	golangci-lint run

diff --git a/README.md b/README.md
diff --git a/bench-mcp.sh b/bench-mcp.sh
@@ -1,53 +1,41 @@
 #!/usr/bin/env bash
-# bench-mcp.sh — benchmark baseline vs agent-index MCP across questions and models
+# bench-mcp.sh — benchmark baseline vs lumen MCP across questions and models
 set -eufo pipefail
 
 REPO="$(cd "$(dirname "$0")" && pwd)"
 FIXTURES_GO="$REPO/testdata/fixtures/go"
 FIXTURES_PY="$REPO/testdata/fixtures/python"
 FIXTURES_TS="$REPO/testdata/fixtures/ts"
-BINARY="$REPO/agent-index"
+BINARY="$REPO/lumen"
 
-# ── Questions (3 languages × 3 difficulty levels) ────────────────────────────
+# ── Questions (3 languages × 1 hard question each) ───────────────────────────
 QUESTIONS=(
   # Go (Prometheus fixtures)
-  "What label matcher types are available and how is a Matcher created? Show the type definitions and constructor."
-  "How does histogram bucket counting work? Show me the relevant function signatures."
   "How does TSDB compaction work end-to-end? Explain the Compactor interface, LeveledCompactor, and how the DB triggers compaction. Show relevant types, interfaces, and key method signatures."
   # Python (Django + Flask fixtures)
-  "How does the Django Permission model work? Show the Permission class, its fields, the PermissionManager, and the get_by_natural_key method."
-  "How does Flask configuration loading work? Explain the Config class, how it loads from files, environment variables, and Python objects. Show the key methods and class hierarchy."
   "How does the Django QuerySet evaluation and filtering pipeline work? Explain QuerySet chaining, lazy evaluation, the Query class, how lookups and filters are compiled into SQL, and how the Manager ties it all together. Show key classes and method signatures."
   # TypeScript (VSCode base library fixtures)
-  "What is the IDisposable interface and how does the Disposable base class work? Show the interface, the base class, and how DisposableStore manages multiple disposables."
-  "How does the event emitter system work? Explain the Event interface, the Emitter class, event composition (map, filter, debounce), and how events integrate with disposables. Show key types and patterns."
   "How do async operations, cancellation, and resource lifecycle management work together? Explain CancelablePromise, CancellationToken, the async utilities (throttle, debounce, retry), how they integrate with the disposable lifecycle system, and how event-driven patterns compose with async flows. Show key interfaces and class relationships."
 )
 Q_SLUGS=(
-  "go-label-matcher"
-  "go-histogram"
   "go-tsdb-compaction"
-  "py-permissions"
-  "py-flask-config"
   "py-django-queryset"
-  "ts-disposable"
-  "ts-event-emitter"
   "ts-async-lifecycle"
 )
 Q_LANG=(
-  "go" "go" "go"
-  "python" "python" "python"
-  "typescript" "typescript" "typescript"
+  "go"
+  "python"
+  "typescript"
 )
 Q_FIXTURES=(
-  "$FIXTURES_GO" "$FIXTURES_GO" "$FIXTURES_GO"
-  "$FIXTURES_PY" "$FIXTURES_PY" "$FIXTURES_PY"
-  "$FIXTURES_TS" "$FIXTURES_TS" "$FIXTURES_TS"
+  "$FIXTURES_GO"
+  "$FIXTURES_PY"
+  "$FIXTURES_TS"
 )
 Q_DIFFICULTY=(
-  "easy" "medium" "hard"
-  "easy" "medium" "hard"
-  "easy" "medium" "hard"
+  "hard"
+  "hard"
+  "hard"
 )
 
 # ── Models ────────────────────────────────────────────────────────────────────
@@ -96,14 +84,14 @@ for i in "${!Q_SLUGS[@]}"; do
 done
 
 # ── Build ──────────────────────────────────────────────────────────────────────
-echo "Building agent-index..."
-CGO_ENABLED=1 go build -o agent-index .
+echo "Building lumen..."
+CGO_ENABLED=1 go build -o lumen .
 
 # ── Index ─────────────────────────────────────────────────────────────────────
 echo "Indexing fixtures..."
 for fx_dir in "$FIXTURES_GO" "$FIXTURES_PY" "$FIXTURES_TS"; do
-  AGENT_INDEX_BACKEND="$EMBED_BACKEND" AGENT_INDEX_EMBED_MODEL="$EMBED_MODEL" \
-    ./agent-index index "$fx_dir" 2>&1 | tail -1
+  LUMEN_BACKEND="$EMBED_BACKEND" LUMEN_EMBED_MODEL="$EMBED_MODEL" \
+    ./lumen index "$fx_dir" 2>&1 | tail -1
 done
 
 # ── MCP configs ───────────────────────────────────────────────────────────────
@@ -112,7 +100,7 @@ MCP_EMPTY=$(mktemp /tmp/bench-mcp-empty-XXXXXX).json
 trap 'rm -f "$MCP_ENABLED" "$MCP_EMPTY"' EXIT
 
 cat > "$MCP_ENABLED" <<EOF
-{"mcpServers":{"agent-index":{"command":"$BINARY","args":["stdio"],"env":{"AGENT_INDEX_BACKEND":"$EMBED_BACKEND","AGENT_INDEX_EMBED_MODEL":"$EMBED_MODEL"}}}}
+{"mcpServers":{"lumen":{"command":"$BINARY","args":["stdio"],"env":{"LUMEN_BACKEND":"$EMBED_BACKEND","LUMEN_EMBED_MODEL":"$EMBED_MODEL"}}}}
 EOF
 echo '{"mcpServers":{}}' > "$MCP_EMPTY"
 
@@ -136,12 +124,13 @@ run() {
   [[ -n "$disable_builtin_tools" ]] && tools_arg=(--tools "")
 
   local allowed_tools_arg=()
-  [[ "$mcp_cfg" == "$MCP_ENABLED" ]] && allowed_tools_arg=(--allowedTools "mcp__agent-index__semantic_search,mcp__agent-index__index_status")
+  [[ "$mcp_cfg" == "$MCP_ENABLED" ]] && allowed_tools_arg=(--allowedTools "mcp__lumen__semantic_search,mcp__lumen__index_status")
 
-  DISABLE_PROMPT_CACHING=1 claude \
+  claude \
     --output-format stream-json \
     --verbose \
     --model "$model" \
+    --effort medium \
     --strict-mcp-config \
     --mcp-config "$mcp_cfg" \
     ${tools_arg[@]:+"${tools_arg[@]}"} \
@@ -229,7 +218,7 @@ $(cat "$af")
   printf "  Judging %-28s ... " "$slug"
 
   # Brief verdict for summary (content quality + efficiency)
-  claude -p --model claude-opus-4-6 \
+  claude -p --model claude-opus-4-6 --effort medium \
     "You are a judge evaluating AI answers to a codebase question. Be concise.
 
 Question: $question
@@ -254,7 +243,7 @@ Example: **Winner: sonnet/mcp-only**" \
     > "$judge_brief_file" 2>&1 || echo "_Judge unavailable_" > "$judge_brief_file"
 
   # Detailed analysis for detail report
-  claude -p --model claude-opus-4-6 \
+  claude -p --model claude-opus-4-6 --effort medium \
     "You are a judge evaluating AI answers to a question about a codebase.
 
 Question: $question

diff --git a/cmd/embedder.go b/cmd/embedder.go
@@ -17,8 +17,8 @@ package cmd
 import (
 	"fmt"
 
-	"github.com/aeneasr/agent-index/internal/config"
-	"github.com/aeneasr/agent-index/internal/embedder"
+	"github.com/aeneasr/lumen/internal/config"
+	"github.com/aeneasr/lumen/internal/embedder"
 )
 
 // newEmbedder creates an Embedder based on the configured backend.

diff --git a/cmd/hook.go b/cmd/hook.go
@@ -0,0 +1,121 @@
+// Copyright 2026 Aeneas Rekkas
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+package cmd
+
+import (
+	"encoding/json"
+	"fmt"
+	"os"
+	"path/filepath"
+	"strings"
+
+	"github.com/spf13/cobra"
+)
+
+// init wires the hook command and its session-start subcommand into rootCmd.
+func init() {
+	rootCmd.AddCommand(hookCmd)
+	hookCmd.AddCommand(hookSessionStartCmd)
+}
+
+// hookCmd is the parent command grouping the hook handler subcommands.
+var hookCmd = &cobra.Command{
+	Use:   "hook",
+	Short: "Hook handlers for AI coding agent integration",
+}
+
+// hookSessionStartCmd prints the SessionStart hook payload. Its optional
+// argument overrides the MCP server name used in the generated tool reference.
+var hookSessionStartCmd = &cobra.Command{
+	Use:   "session-start [mcp-name]",
+	Short: "Output SessionStart hook JSON for Claude Code",
+	Args:  cobra.MaximumNArgs(1),
+	RunE:  runHookSessionStart,
+}
+
+// hookOutput is the JSON structure Claude Code expects from a synchronous hook.
+type hookOutput struct {
+	HookSpecificOutput hookSpecificOutput `json:"hookSpecificOutput"`
+}
+
+// hookSpecificOutput names the hook event and carries the text emitted as
+// additionalContext.
+type hookSpecificOutput struct {
+	HookEventName     string `json:"hookEventName"`
+	AdditionalContext string `json:"additionalContext"`
+}
+
+// defaultMCPName derives the fallback MCP server name from the executable path
+// argv0: the base name with a trailing ".exe" (any case) removed, so a Windows
+// binary yields the same tool reference as on other platforms.
+func defaultMCPName(argv0 string) string {
+	name := filepath.Base(argv0)
+	if ext := filepath.Ext(name); len(name) > len(ext) && strings.EqualFold(ext, ".exe") {
+		name = name[:len(name)-len(ext)]
+	}
+	return name
+}
+
+// runHookSessionStart writes the SessionStart hook payload to stdout as a
+// single line of JSON. The MCP server name is args[0] when given and non-empty;
+// otherwise it is derived from the executable name. It returns an error only
+// if encoding or writing the payload fails.
+func runHookSessionStart(_ *cobra.Command, args []string) error {
+	mcpName := defaultMCPName(os.Args[0])
+	if len(args) > 0 && args[0] != "" {
+		mcpName = args[0]
+	}
+
+	out := hookOutput{
+		HookSpecificOutput: hookSpecificOutput{
+			HookEventName:     "SessionStart",
+			AdditionalContext: generateHookContent(mcpName),
+		},
+	}
+
+	// The payload contains literal <EXTREMELY_IMPORTANT> tags; disable HTML
+	// escaping so they are not emitted as \u003c / \u003e sequences.
+	enc := json.NewEncoder(os.Stdout)
+	enc.SetEscapeHTML(false)
+	if err := enc.Encode(out); err != nil {
+		return fmt.Errorf("encoding SessionStart hook output: %w", err)
+	}
+	return nil
+}
+
+// generateHookContent builds the EXTREMELY_IMPORTANT-wrapped directive for the
+// SessionStart hook. This is a stronger version of generateSnippet designed to
+// achieve near-100% tool trigger rate.
+//
+// mcpName is interpolated verbatim into the tool reference
+// mcp__<mcpName>__semantic_search.
+func generateHookContent(mcpName string) string {
+	toolRef := "`mcp__" + mcpName + "__semantic_search`"
+	return "<EXTREMELY_IMPORTANT>\n" +
+		"# Lumen Semantic Search\n\n" +
+		"ALWAYS use " + toolRef + " as the FIRST tool for code discovery.\n\n" +
+		"Before using Grep, Glob, Find, or Read for any search, stop and ask:\n" +
+		"\"Do I already know the exact literal string I'm searching for?\"\n" +
+		"If not, use " + toolRef + ".\n\n" +
+		"## Red Flags — if you think any of these, STOP:\n" +
+		"| Thought | Reality |\n" +
+		"|---------|--------|\n" +
+		"| \"I'll just grep quickly\" | " + toolRef + " is faster for discovery |\n" +
+		"| \"I know the file name\" | You might not know the best match |\n" +
+		"| \"Glob is faster for this\" | Only if you have an exact filename pattern |\n" +
+		"| \"This is a simple search\" | Simple searches benefit most from semantic |\n\n" +
+		"If semantic search is unavailable, Grep/Glob are acceptable fallbacks.\n" +
+		"</EXTREMELY_IMPORTANT>"
+}
diff --git a/cmd/hook_test.go b/cmd/hook_test.go
@@ -0,0 +1,144 @@
+// Copyright 2026 Aeneas Rekkas
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+package cmd
+
+import (
+	"encoding/json"
+	"io"
+	"os"
+	"strings"
+	"testing"
+)
+
+// TestGenerateHookContent checks the wrapper tags, the tool reference and the
+// red-flags table for a plain and a hyphenated MCP server name.
+func TestGenerateHookContent(t *testing.T) {
+	cases := []struct {
+		mcpName string
+		wantRef string
+	}{
+		{"lumen", "mcp__lumen__semantic_search"},
+		{"my-custom-server", "mcp__my-custom-server__semantic_search"},
+	}
+
+	for _, tc := range cases {
+		t.Run(tc.mcpName, func(t *testing.T) {
+			content := generateHookContent(tc.mcpName)
+			if !strings.HasPrefix(content, "<EXTREMELY_IMPORTANT>") {
+				t.Error("content should start with <EXTREMELY_IMPORTANT>")
+			}
+			if !strings.HasSuffix(content, "</EXTREMELY_IMPORTANT>") {
+				t.Error("content should end with </EXTREMELY_IMPORTANT>")
+			}
+			if !strings.Contains(content, tc.wantRef) {
+				t.Errorf("expected %q in content, got: %s", tc.wantRef, content)
+			}
+			if !strings.Contains(content, "Red Flags") {
+				t.Error("content should contain rationalization-blocking table")
+			}
+		})
+	}
+}
+
+// TestHookOutputJSON marshals a hookOutput and checks the JSON key names and
+// that additionalContext round-trips unchanged.
+func TestHookOutputJSON(t *testing.T) {
+	content := generateHookContent("lumen")
+	out := hookOutput{
+		HookSpecificOutput: hookSpecificOutput{
+			HookEventName:     "SessionStart",
+			AdditionalContext: content,
+		},
+	}
+
+	data, err := json.Marshal(out)
+	if err != nil {
+		t.Fatalf("json.Marshal: %v", err)
+	}
+
+	var parsed map[string]any
+	if err := json.Unmarshal(data, &parsed); err != nil {
+		t.Fatalf("json.Unmarshal: %v", err)
+	}
+
+	hso, ok := parsed["hookSpecificOutput"].(map[string]any)
+	if !ok {
+		t.Fatal("missing hookSpecificOutput key")
+	}
+	if hso["hookEventName"] != "SessionStart" {
+		t.Errorf("hookEventName = %v, want SessionStart", hso["hookEventName"])
+	}
+	// Compare the whole string: a substring check would also pass for
+	// truncated or otherwise altered context.
+	if ctx, _ := hso["additionalContext"].(string); ctx != content {
+		t.Errorf("additionalContext = %q, want %q", ctx, content)
+	}
+}
+
+// TestRunHookSessionStart runs the command handler with stdout redirected to a
+// pipe and checks the emitted JSON, including that the wrapper tags are written
+// literally rather than HTML-escaped.
+func TestRunHookSessionStart(t *testing.T) {
+	r, w, err := os.Pipe()
+	if err != nil {
+		t.Fatalf("os.Pipe: %v", err)
+	}
+	t.Cleanup(func() { _ = r.Close() })
+
+	// Drain the pipe concurrently so the handler cannot block on a full pipe
+	// buffer.
+	type readResult struct {
+		data []byte
+		err  error
+	}
+	done := make(chan readResult, 1)
+	go func() {
+		data, readErr := io.ReadAll(r)
+		done <- readResult{data: data, err: readErr}
+	}()
+
+	stdout := os.Stdout
+	os.Stdout = w
+	runErr := runHookSessionStart(nil, []string{"lumen"})
+	os.Stdout = stdout
+	if err := w.Close(); err != nil {
+		t.Fatalf("closing pipe writer: %v", err)
+	}
+	res := <-done
+
+	if runErr != nil {
+		t.Fatalf("runHookSessionStart: %v", runErr)
+	}
+	if res.err != nil {
+		t.Fatalf("reading captured stdout: %v", res.err)
+	}
+	if !strings.Contains(string(res.data), "<EXTREMELY_IMPORTANT>") {
+		t.Errorf("stdout should contain the unescaped opening tag, got: %s", res.data)
+	}
+
+	var got hookOutput
+	if err := json.Unmarshal(res.data, &got); err != nil {
+		t.Fatalf("json.Unmarshal: %v", err)
+	}
+	want := hookOutput{
+		HookSpecificOutput: hookSpecificOutput{
+			HookEventName:     "SessionStart",
+			AdditionalContext: generateHookContent("lumen"),
+		},
+	}
+	if got != want {
+		t.Errorf("decoded output = %+v, want %+v", got, want)
+	}
+}