C: bulk playbook record — operational rating wiring

POST /v1/matrix/playbooks/bulk accepts an array of playbook entries and records each independently — failures per-entry don't abort the batch. Designed for two operational use cases: 1. Backfilling historical placement data into the playbook substrate (the Rust system has 4,701 fill operations recorded with embeddings; that data deserves to feed the Go learning loop without a 4,701-call procedural script). 2. Batched click-tracking from a session's worth of coordinator interactions, posted once at idle rather than per-click. Per-entry response shape: {index, playbook_id} on success or {index, error} on failure. Caller can inspect failures without diffing. Smoke (scripts/playbook_smoke.sh, new assertion #4): Bulk POST 3 entries: 2 valid (alpha→widget-a, bravo→widget-b) + 1 invalid (empty query_text). Verifies recorded=2, failed=1, the 2 valid ones get playbook_ids back, and the invalid one surfaces its validation error in-line. Single-record /matrix/playbooks/record from 06e7152 still works unchanged; bulk is additive. The corpus field can be set per- entry or once at the batch level (entry-level wins on collision). Per the small-model autonomous pipeline framing: this is the "the playbook gets denser with each iteration" mechanism. Click tracking → bulk POST → playbook entries → future similar queries get those answers boosted via the existing /matrix/search use_playbook path. The learning loop now has both inflows wired (single + bulk) — what remains is the demo UI shim that calls /feedback on result interaction (deferred — no Go demo UI yet). 15-smoke regression all green. Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
2026-04-29 20:10:13 -05:00 · 2026-04-29 20:10:13 -05:00 · 6392772f41
commit 6392772f41
parent b199093d1f
2 changed files with 90 additions and 1 deletions
--- a/cmd/matrixd/main.go
+++ b/cmd/matrixd/main.go
@ -7,8 +7,12 @@
 //   GET  /matrix/corpora            — list known vectord indexes
 //   POST /matrix/relevance          — adjacency-pollution filter
 //   POST /matrix/downgrade          — strong-model downgrade gate
-//   POST /matrix/playbooks/record   — record a (query → answer)
+//   POST /matrix/playbooks/record   — record a single (query → answer)
 //                                      success for the learning loop
+//   POST /matrix/playbooks/bulk     — bulk-record N successes; useful
+//                                      for backfilling historical
+//                                      placement data into the
+//                                      playbook substrate
 //
 // matrixd talks to embedd (for query-text embedding) and vectord
 // (for per-corpus search) via HTTP. Both URLs come from
@ -66,6 +70,7 @@ func (h *handlers) register(r chi.Router) {
 	r.Post("/matrix/relevance", h.handleRelevance)
 	r.Post("/matrix/downgrade", h.handleDowngrade)
 	r.Post("/matrix/playbooks/record", h.handlePlaybookRecord)
+	r.Post("/matrix/playbooks/bulk", h.handlePlaybookBulk)
 }

 func (h *handlers) handleSearch(w http.ResponseWriter, r *http.Request) {
@ -142,6 +147,67 @@ func (h *handlers) handlePlaybookRecord(w http.ResponseWriter, r *http.Request)
 	})
 }

+// playbookBulkRequest is the POST /matrix/playbooks/bulk body —
+// component C (operational rating wiring). Used to backfill
+// historical placement data, or batch-record a session's worth of
+// coordinator click-tracking. Each Entry is recorded independently;
+// failures are reported per-entry without aborting the batch.
+type playbookBulkRequest struct {
+	Entries []playbookRecordRequest `json:"entries"`
+	Corpus  string                  `json:"corpus,omitempty"` // applies to all if entry-level not set
+}
+
+// playbookBulkResult reports per-entry outcomes plus the aggregate
+// count. Errors include the entry index so callers can locate the
+// offending record without diffing.
+type playbookBulkResult struct {
+	Recorded int                      `json:"recorded"`
+	Failed   int                      `json:"failed"`
+	Results  []playbookBulkItemResult `json:"results"`
+}
+
+type playbookBulkItemResult struct {
+	Index      int    `json:"index"`
+	PlaybookID string `json:"playbook_id,omitempty"`
+	Error      string `json:"error,omitempty"`
+}
+
+func (h *handlers) handlePlaybookBulk(w http.ResponseWriter, r *http.Request) {
+	var req playbookBulkRequest
+	if !decodeJSON(w, r, &req) {
+		return
+	}
+	if len(req.Entries) == 0 {
+		http.Error(w, "entries must be non-empty", http.StatusBadRequest)
+		return
+	}
+
+	out := playbookBulkResult{
+		Results: make([]playbookBulkItemResult, len(req.Entries)),
+	}
+	for i, item := range req.Entries {
+		corpus := item.Corpus
+		if corpus == "" {
+			corpus = req.Corpus
+		}
+		entry := matrix.NewPlaybookEntry(item.QueryText, item.AnswerID, item.AnswerCorpus, item.Score, item.Tags)
+		if err := entry.Validate(); err != nil {
+			out.Results[i] = playbookBulkItemResult{Index: i, Error: err.Error()}
+			out.Failed++
+			continue
+		}
+		pbID, err := h.r.Record(r.Context(), entry, corpus)
+		if err != nil {
+			out.Results[i] = playbookBulkItemResult{Index: i, Error: err.Error()}
+			out.Failed++
+			continue
+		}
+		out.Results[i] = playbookBulkItemResult{Index: i, PlaybookID: pbID}
+		out.Recorded++
+	}
+	writeJSON(w, http.StatusOK, out)
+}
+
 // downgradeRequest is the POST /matrix/downgrade body. Mirrors
 // matrix.DowngradeInput. When ForceFullOverride is omitted from
 // the body, the value falls back to matrixd's process env
--- a/scripts/playbook_smoke.sh
+++ b/scripts/playbook_smoke.sh
@ -166,6 +166,29 @@ else
  echo "  ✗ ratio out of band: $RATIO"; FAILED=1
 fi

+# ── 4. /matrix/playbooks/bulk — component C (operational rating wiring)
+echo "[playbook-smoke] bulk record 3 entries:"
+BULK_RESP="$(curl -sS -X POST http://127.0.0.1:3110/v1/matrix/playbooks/bulk \
+  -H 'Content-Type: application/json' \
+  -d "$(jq -n '{
+    entries: [
+      {query_text: "alpha test query",   answer_id: "widget-a", answer_corpus: "widgets", score: 0.9},
+      {query_text: "bravo test query",   answer_id: "widget-b", answer_corpus: "widgets", score: 0.8},
+      {query_text: "",                   answer_id: "x",        answer_corpus: "widgets", score: 0.5}
+    ]
+  }')")"
+RECORDED="$(echo "$BULK_RESP" | jq -r '.recorded')"
+FAIL="$(echo "$BULK_RESP" | jq -r '.failed')"
+GOT_PB_A="$(echo "$BULK_RESP" | jq -r '.results[0].playbook_id // empty')"
+ERR_BAD="$(echo "$BULK_RESP" | jq -r '.results[2].error // empty')"
+if [ "$RECORDED" = "2" ] && [ "$FAIL" = "1" ] && [ -n "$GOT_PB_A" ] && [ -n "$ERR_BAD" ]; then
+  echo "  ✓ 2 recorded, 1 failed (empty query_text caught), per-entry IDs/errors returned"
+else
+  echo "  ✗ recorded=$RECORDED failed=$FAIL pb_a=$GOT_PB_A err=$ERR_BAD"
+  echo "    full: $BULK_RESP"
+  FAILED=1
+fi
+
 if [ "$FAILED" -eq 0 ]; then
  echo "[playbook-smoke] Playbook acceptance gate: PASSED"
  exit 0