From 0b37a87877d24eb80f8cde163684b2e7717efac9 Mon Sep 17 00:00:00 2001 From: Reynier Ortiz Vega Date: Tue, 21 Apr 2026 18:25:54 -0400 Subject: [PATCH 01/23] Add .worktrees to gitignore --- .gitignore | 1 + 1 file changed, 1 insertion(+) diff --git a/.gitignore b/.gitignore index e1cee41ee4..c262aa0c23 100644 --- a/.gitignore +++ b/.gitignore @@ -47,3 +47,4 @@ coverage* crd-helm-wrapper cmd/vmcp/__debug_bin* /vmcp +.worktrees/ From 7bd981630fb2f9b2def340938079736b44cedad8 Mon Sep 17 00:00:00 2001 From: Reynier Ortiz Vega Date: Tue, 21 Apr 2026 18:40:24 -0400 Subject: [PATCH 02/23] Add memory package types Introduces the core domain types for ToolHive's shared long-term memory system: MemoryEntry, MemoryRevision, typed constants for MemoryType, AuthorType, SourceType, EntryStatus, and ArchiveReason, plus filter and result types used by the store interface. Co-Authored-By: Claude Sonnet 4.6 --- pkg/memory/types.go | 146 +++++++++++++++++++++++++++++++++++++++ pkg/memory/types_test.go | 24 +++++++ 2 files changed, 170 insertions(+) create mode 100644 pkg/memory/types.go create mode 100644 pkg/memory/types_test.go diff --git a/pkg/memory/types.go b/pkg/memory/types.go new file mode 100644 index 0000000000..04fa0b1754 --- /dev/null +++ b/pkg/memory/types.go @@ -0,0 +1,146 @@ +// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc. +// SPDX-License-Identifier: Apache-2.0 + +// Package memory defines the types and interfaces for ToolHive's shared long-term memory system. +package memory + +import "time" + +// MemoryType distinguishes the two long-term memory namespaces. +// +//nolint:revive // MemoryType is the canonical cross-package name; renaming to Type causes ambiguity. +type MemoryType string + +const ( + // MemoryTypeSemantic represents factual knowledge and world-state memories. + MemoryTypeSemantic MemoryType = "semantic" + // MemoryTypeProcedural represents how-to knowledge and step-based memories. 
+ MemoryTypeProcedural MemoryType = "procedural" +) + +// AuthorType records whether a memory was written by a human or an agent. +type AuthorType string + +const ( + // AuthorHuman indicates the memory was written by a human user. + AuthorHuman AuthorType = "human" + // AuthorAgent indicates the memory was written by an AI agent. + AuthorAgent AuthorType = "agent" +) + +// SourceType records whether a memory entry originates from the store or is a +// read-only index of an installed Skill. +type SourceType string + +const ( + // SourceMemory indicates the entry originates from the writable memory store. + SourceMemory SourceType = "memory" + // SourceSkill indicates the entry is a read-only index of an installed Skill. + SourceSkill SourceType = "skill" +) + +// EntryStatus is the lifecycle state of a memory entry. +type EntryStatus string + +const ( + // EntryStatusActive indicates the entry is in normal use. + EntryStatusActive EntryStatus = "active" + // EntryStatusFlagged indicates the entry has been marked for review. + EntryStatusFlagged EntryStatus = "flagged" + // EntryStatusExpired indicates the entry has passed its TTL. + EntryStatusExpired EntryStatus = "expired" + // EntryStatusArchived indicates the entry has been moved to the archive. + EntryStatusArchived EntryStatus = "archived" +) + +// ArchiveReason records why an entry was archived. +type ArchiveReason string + +const ( + // ArchiveReasonConsolidated indicates the entry was merged into a newer entry. + ArchiveReasonConsolidated ArchiveReason = "consolidated" + // ArchiveReasonCrystallized indicates the entry was promoted to a skill. + ArchiveReasonCrystallized ArchiveReason = "crystallized" + // ArchiveReasonManual indicates the entry was manually archived. + ArchiveReasonManual ArchiveReason = "manual" + // ArchiveReasonExpired indicates the entry exceeded its TTL. + ArchiveReasonExpired ArchiveReason = "expired" +) + +// MemoryEntry is the core domain type representing one stored memory. 
+// +//nolint:revive // MemoryEntry is the canonical cross-package name; renaming to Entry conflicts with common identifiers. +type MemoryEntry struct { + ID string + Type MemoryType + Content string + Tags []string + Author AuthorType + AgentID string + SessionID string + Source SourceType + SkillRef string + Status EntryStatus + TrustScore float32 + StalenessScore float32 + AccessCount int + LastAccessedAt time.Time + FlaggedAt *time.Time + FlagReason string + TTLDays *int + ExpiresAt *time.Time + ArchivedAt *time.Time + ConsolidatedInto string + CrystallizedInto string + History []MemoryRevision + CreatedAt time.Time + UpdatedAt time.Time +} + +// MemoryRevision records a single correction to a memory entry. +// +//nolint:revive // MemoryRevision is the canonical cross-package name; renaming to Revision causes ambiguity. +type MemoryRevision struct { + Content string + Author AuthorType + CorrectionNote string + Timestamp time.Time +} + +// ListFilter restricts results returned by MemoryStore.List. +type ListFilter struct { + Type *MemoryType + Author *AuthorType + Tags []string + Source *SourceType + Status *EntryStatus + Limit int + Offset int +} + +// VectorFilter restricts similarity search to a subset of entries. +type VectorFilter struct { + Type *MemoryType + Status *EntryStatus +} + +// ScoredID pairs an entry ID with its cosine similarity to a query. +type ScoredID struct { + ID string + Similarity float32 +} + +// ScoredEntry pairs a full MemoryEntry with its similarity to a query. +type ScoredEntry struct { + Entry MemoryEntry + Similarity float32 +} + +// ConflictResult describes a potentially conflicting existing memory returned +// during a write conflict check. 
+type ConflictResult struct { + ID string + Content string + Similarity float32 + TrustScore float32 +} diff --git a/pkg/memory/types_test.go b/pkg/memory/types_test.go new file mode 100644 index 0000000000..86b255f32f --- /dev/null +++ b/pkg/memory/types_test.go @@ -0,0 +1,24 @@ +// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc. +// SPDX-License-Identifier: Apache-2.0 + +package memory_test + +import ( + "testing" + + "github.com/stretchr/testify/require" + + "github.com/stacklok/toolhive/pkg/memory" +) + +func TestMemoryTypeConstants(t *testing.T) { + t.Parallel() + require.Equal(t, memory.MemoryType("semantic"), memory.MemoryTypeSemantic) + require.Equal(t, memory.MemoryType("procedural"), memory.MemoryTypeProcedural) + require.Equal(t, memory.AuthorType("human"), memory.AuthorHuman) + require.Equal(t, memory.AuthorType("agent"), memory.AuthorAgent) + require.Equal(t, memory.EntryStatus("active"), memory.EntryStatusActive) + require.Equal(t, memory.EntryStatus("flagged"), memory.EntryStatusFlagged) + require.Equal(t, memory.EntryStatus("expired"), memory.EntryStatusExpired) + require.Equal(t, memory.EntryStatus("archived"), memory.EntryStatusArchived) +} From 3bf0acf3ce55fd4722d8f37f15f82198969800ca Mon Sep 17 00:00:00 2001 From: Reynier Ortiz Vega Date: Wed, 22 Apr 2026 10:54:29 -0400 Subject: [PATCH 03/23] Add shared long-term memory server core package MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Introduces pkg/memory with three pluggable interfaces (Store, VectorStore, Embedder), a Service orchestration layer with conflict detection and score-weighted search ranking, SQLite-backed implementations, an Ollama embedder, and gomock mocks for all interfaces. 
Key behaviours: - Conflict detection on write: cosine similarity > 0.85 blocks the write and returns conflicting entries for the agent to resolve - Trust scoring: author weight × age decay × correction penalty × flag multiplier - Staleness scoring: access age + flag bonus + correction bonus - Search ranking: composite score (similarity × trust × staleness penalty) so flagged/stale entries do not rank above fresh, trusted ones - TypeEpisodic memory type for time-indexed event records - ListFilter time-range fields (CreatedAfter/CreatedBefore) for timeline queries - SQLite migration 002 widens the type CHECK constraint to include episodic Co-Authored-By: Claude Sonnet 4.6 --- pkg/memory/embedder/ollama/embedder.go | 88 +++++ pkg/memory/embedder/ollama/embedder_test.go | 35 ++ pkg/memory/errors.go | 9 + pkg/memory/interfaces.go | 51 +++ pkg/memory/mocks/mock_embedder.go | 70 ++++ pkg/memory/mocks/mock_store.go | 214 ++++++++++ pkg/memory/mocks/mock_vector.go | 85 ++++ pkg/memory/scoring.go | 70 ++++ pkg/memory/scoring_test.go | 138 +++++++ pkg/memory/service.go | 205 ++++++++++ pkg/memory/service_test.go | 153 ++++++++ pkg/memory/sqlite/db.go | 106 +++++ pkg/memory/sqlite/migrations/001_initial.sql | 60 +++ .../migrations/002_add_episodic_type.sql | 83 ++++ pkg/memory/sqlite/store.go | 364 ++++++++++++++++++ pkg/memory/sqlite/store_test.go | 167 ++++++++ pkg/memory/sqlite/vector.go | 127 ++++++ pkg/memory/sqlite/vector_test.go | 74 ++++ pkg/memory/types.go | 57 +-- pkg/memory/types_test.go | 11 +- 20 files changed, 2137 insertions(+), 30 deletions(-) create mode 100644 pkg/memory/embedder/ollama/embedder.go create mode 100644 pkg/memory/embedder/ollama/embedder_test.go create mode 100644 pkg/memory/errors.go create mode 100644 pkg/memory/interfaces.go create mode 100644 pkg/memory/mocks/mock_embedder.go create mode 100644 pkg/memory/mocks/mock_store.go create mode 100644 pkg/memory/mocks/mock_vector.go create mode 100644 pkg/memory/scoring.go create mode 100644 
pkg/memory/scoring_test.go create mode 100644 pkg/memory/service.go create mode 100644 pkg/memory/service_test.go create mode 100644 pkg/memory/sqlite/db.go create mode 100644 pkg/memory/sqlite/migrations/001_initial.sql create mode 100644 pkg/memory/sqlite/migrations/002_add_episodic_type.sql create mode 100644 pkg/memory/sqlite/store.go create mode 100644 pkg/memory/sqlite/store_test.go create mode 100644 pkg/memory/sqlite/vector.go create mode 100644 pkg/memory/sqlite/vector_test.go diff --git a/pkg/memory/embedder/ollama/embedder.go b/pkg/memory/embedder/ollama/embedder.go new file mode 100644 index 0000000000..00ca3817ee --- /dev/null +++ b/pkg/memory/embedder/ollama/embedder.go @@ -0,0 +1,88 @@ +// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc. +// SPDX-License-Identifier: Apache-2.0 + +// Package ollama provides a memory.Embedder backed by a local Ollama server. +package ollama + +import ( + "bytes" + "context" + "encoding/json" + "fmt" + "io" + "net/http" + "net/url" + + "github.com/stacklok/toolhive/pkg/memory" +) + +// Embedder calls the Ollama /api/embeddings endpoint. +type Embedder struct { + baseURL string + model string + dimensions int + client *http.Client +} + +// New creates an Ollama embedder. It probes the server once to discover the +// embedding dimension. Returns an error if the server is unreachable or the +// model returns an empty vector. +func New(baseURL, model string) (*Embedder, error) { + if _, err := url.ParseRequestURI(baseURL); err != nil { + return nil, fmt.Errorf("invalid Ollama URL %q: %w", baseURL, err) + } + if model == "" { + return nil, fmt.Errorf("model name is required") + } + e := &Embedder{baseURL: baseURL, model: model, client: &http.Client{}} + + emb, err := e.Embed(context.Background(), "probe") + if err != nil { + return nil, fmt.Errorf("probing Ollama embedder: %w", err) + } + e.dimensions = len(emb) + return e, nil +} + +// Embed calls the Ollama /api/embeddings endpoint and returns the vector. 
+func (e *Embedder) Embed(ctx context.Context, text string) ([]float32, error) { + body, err := json.Marshal(map[string]string{"model": e.model, "prompt": text}) + if err != nil { + return nil, err + } + + req, err := http.NewRequestWithContext(ctx, http.MethodPost, e.baseURL+"/api/embeddings", bytes.NewReader(body)) + if err != nil { + return nil, err + } + req.Header.Set("Content-Type", "application/json") + + resp, err := e.client.Do(req) + if err != nil { + return nil, fmt.Errorf("calling Ollama: %w", err) + } + defer func() { + _, _ = io.Copy(io.Discard, resp.Body) + _ = resp.Body.Close() + }() + + if resp.StatusCode != http.StatusOK { + return nil, fmt.Errorf("ollama returned status %d", resp.StatusCode) + } + + var result struct { + Embedding []float32 `json:"embedding"` + } + if err := json.NewDecoder(resp.Body).Decode(&result); err != nil { + return nil, fmt.Errorf("decoding Ollama response: %w", err) + } + if len(result.Embedding) == 0 { + return nil, fmt.Errorf("ollama returned empty embedding") + } + return result.Embedding, nil +} + +// Dimensions returns the fixed vector length produced by this embedder. +func (e *Embedder) Dimensions() int { return e.dimensions } + +var _ memory.Embedder = (*Embedder)(nil) diff --git a/pkg/memory/embedder/ollama/embedder_test.go b/pkg/memory/embedder/ollama/embedder_test.go new file mode 100644 index 0000000000..bb601fae1b --- /dev/null +++ b/pkg/memory/embedder/ollama/embedder_test.go @@ -0,0 +1,35 @@ +// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc. 
+// SPDX-License-Identifier: Apache-2.0 + +package ollama_test + +import ( + "context" + "encoding/json" + "net/http" + "net/http/httptest" + "testing" + + "github.com/stretchr/testify/require" + + "github.com/stacklok/toolhive/pkg/memory/embedder/ollama" +) + +func TestEmbed(t *testing.T) { + t.Parallel() + + want := []float32{0.1, 0.2, 0.3} + srv := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) { + require.Equal(t, "/api/embeddings", r.URL.Path) + _ = json.NewEncoder(w).Encode(map[string]any{"embedding": want}) + })) + t.Cleanup(srv.Close) + + e, err := ollama.New(srv.URL, "nomic-embed-text") + require.NoError(t, err) + require.Equal(t, 3, e.Dimensions()) + + got, err := e.Embed(context.Background(), "hello world") + require.NoError(t, err) + require.InDeltaSlice(t, want, got, 0.001) +} diff --git a/pkg/memory/errors.go b/pkg/memory/errors.go new file mode 100644 index 0000000000..b17a40c1a2 --- /dev/null +++ b/pkg/memory/errors.go @@ -0,0 +1,9 @@ +// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc. +// SPDX-License-Identifier: Apache-2.0 + +package memory + +import "errors" + +// ErrNotFound is returned when a memory entry does not exist. +var ErrNotFound = errors.New("memory entry not found") diff --git a/pkg/memory/interfaces.go b/pkg/memory/interfaces.go new file mode 100644 index 0000000000..5f26d39076 --- /dev/null +++ b/pkg/memory/interfaces.go @@ -0,0 +1,51 @@ +// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc. 
+// SPDX-License-Identifier: Apache-2.0 + +package memory + +import "context" + +//go:generate mockgen -destination mocks/mock_store.go -package mocks github.com/stacklok/toolhive/pkg/memory Store +//go:generate mockgen -destination mocks/mock_vector.go -package mocks github.com/stacklok/toolhive/pkg/memory VectorStore +//go:generate mockgen -destination mocks/mock_embedder.go -package mocks github.com/stacklok/toolhive/pkg/memory Embedder + +// Store is the structured persistence layer for memory entries. +// It handles CRUD, lifecycle transitions, and score updates. +// Implementations must be safe for concurrent use. +type Store interface { + Create(ctx context.Context, entry Entry) error + Get(ctx context.Context, id string) (Entry, error) + // Update replaces the content of an existing entry and appends the + // previous content to History. The embedding must be recomputed by + // the caller (Service) after this call succeeds. + Update(ctx context.Context, id string, content string, author AuthorType, correctionNote string) error + Flag(ctx context.Context, id string, reason string) error + Unflag(ctx context.Context, id string) error + Delete(ctx context.Context, id string) error + List(ctx context.Context, filter ListFilter) ([]Entry, error) + Archive(ctx context.Context, id string, reason ArchiveReason, ref string) error + IncrementAccess(ctx context.Context, id string) error + UpdateScores(ctx context.Context, id string, trustScore, stalenessScore float32) error + // ListExpired returns all active entries whose ExpiresAt is in the past. + ListExpired(ctx context.Context) ([]Entry, error) + // ListActive returns all non-archived entries for score recomputation. + ListActive(ctx context.Context) ([]Entry, error) +} + +// VectorStore stores and queries embedding vectors for memory entries. +// Implementations must be safe for concurrent use. +type VectorStore interface { + // Upsert stores or replaces the embedding for the given entry ID. 
+ Upsert(ctx context.Context, id string, embedding []float32) error + // Search returns the topK entries most similar to query, restricted by filter. + Search(ctx context.Context, query []float32, topK int, filter VectorFilter) ([]ScoredID, error) + Delete(ctx context.Context, id string) error +} + +// Embedder converts text to a fixed-dimension float32 vector. +// Implementations must be safe for concurrent use. +type Embedder interface { + Embed(ctx context.Context, text string) ([]float32, error) + // Dimensions returns the fixed vector length produced by this embedder. + Dimensions() int +} diff --git a/pkg/memory/mocks/mock_embedder.go b/pkg/memory/mocks/mock_embedder.go new file mode 100644 index 0000000000..ee6fbc7b24 --- /dev/null +++ b/pkg/memory/mocks/mock_embedder.go @@ -0,0 +1,70 @@ +// Code generated by MockGen. DO NOT EDIT. +// Source: github.com/stacklok/toolhive/pkg/memory (interfaces: Embedder) +// +// Generated by this command: +// +// mockgen -destination mocks/mock_embedder.go -package mocks github.com/stacklok/toolhive/pkg/memory Embedder +// + +// Package mocks is a generated GoMock package. +package mocks + +import ( + context "context" + reflect "reflect" + + gomock "go.uber.org/mock/gomock" +) + +// MockEmbedder is a mock of Embedder interface. +type MockEmbedder struct { + ctrl *gomock.Controller + recorder *MockEmbedderMockRecorder + isgomock struct{} +} + +// MockEmbedderMockRecorder is the mock recorder for MockEmbedder. +type MockEmbedderMockRecorder struct { + mock *MockEmbedder +} + +// NewMockEmbedder creates a new mock instance. +func NewMockEmbedder(ctrl *gomock.Controller) *MockEmbedder { + mock := &MockEmbedder{ctrl: ctrl} + mock.recorder = &MockEmbedderMockRecorder{mock} + return mock +} + +// EXPECT returns an object that allows the caller to indicate expected use. +func (m *MockEmbedder) EXPECT() *MockEmbedderMockRecorder { + return m.recorder +} + +// Dimensions mocks base method. 
+func (m *MockEmbedder) Dimensions() int { + m.ctrl.T.Helper() + ret := m.ctrl.Call(m, "Dimensions") + ret0, _ := ret[0].(int) + return ret0 +} + +// Dimensions indicates an expected call of Dimensions. +func (mr *MockEmbedderMockRecorder) Dimensions() *gomock.Call { + mr.mock.ctrl.T.Helper() + return mr.mock.ctrl.RecordCallWithMethodType(mr.mock, "Dimensions", reflect.TypeOf((*MockEmbedder)(nil).Dimensions)) +} + +// Embed mocks base method. +func (m *MockEmbedder) Embed(ctx context.Context, text string) ([]float32, error) { + m.ctrl.T.Helper() + ret := m.ctrl.Call(m, "Embed", ctx, text) + ret0, _ := ret[0].([]float32) + ret1, _ := ret[1].(error) + return ret0, ret1 +} + +// Embed indicates an expected call of Embed. +func (mr *MockEmbedderMockRecorder) Embed(ctx, text any) *gomock.Call { + mr.mock.ctrl.T.Helper() + return mr.mock.ctrl.RecordCallWithMethodType(mr.mock, "Embed", reflect.TypeOf((*MockEmbedder)(nil).Embed), ctx, text) +} diff --git a/pkg/memory/mocks/mock_store.go b/pkg/memory/mocks/mock_store.go new file mode 100644 index 0000000000..29e3d1f860 --- /dev/null +++ b/pkg/memory/mocks/mock_store.go @@ -0,0 +1,214 @@ +// Code generated by MockGen. DO NOT EDIT. +// Source: github.com/stacklok/toolhive/pkg/memory (interfaces: Store) +// +// Generated by this command: +// +// mockgen -destination mocks/mock_store.go -package mocks github.com/stacklok/toolhive/pkg/memory Store +// + +// Package mocks is a generated GoMock package. +package mocks + +import ( + context "context" + reflect "reflect" + + memory "github.com/stacklok/toolhive/pkg/memory" + gomock "go.uber.org/mock/gomock" +) + +// MockStore is a mock of Store interface. +type MockStore struct { + ctrl *gomock.Controller + recorder *MockStoreMockRecorder + isgomock struct{} +} + +// MockStoreMockRecorder is the mock recorder for MockStore. +type MockStoreMockRecorder struct { + mock *MockStore +} + +// NewMockStore creates a new mock instance. 
+func NewMockStore(ctrl *gomock.Controller) *MockStore { + mock := &MockStore{ctrl: ctrl} + mock.recorder = &MockStoreMockRecorder{mock} + return mock +} + +// EXPECT returns an object that allows the caller to indicate expected use. +func (m *MockStore) EXPECT() *MockStoreMockRecorder { + return m.recorder +} + +// Archive mocks base method. +func (m *MockStore) Archive(ctx context.Context, id string, reason memory.ArchiveReason, ref string) error { + m.ctrl.T.Helper() + ret := m.ctrl.Call(m, "Archive", ctx, id, reason, ref) + ret0, _ := ret[0].(error) + return ret0 +} + +// Archive indicates an expected call of Archive. +func (mr *MockStoreMockRecorder) Archive(ctx, id, reason, ref any) *gomock.Call { + mr.mock.ctrl.T.Helper() + return mr.mock.ctrl.RecordCallWithMethodType(mr.mock, "Archive", reflect.TypeOf((*MockStore)(nil).Archive), ctx, id, reason, ref) +} + +// Create mocks base method. +func (m *MockStore) Create(ctx context.Context, entry memory.Entry) error { + m.ctrl.T.Helper() + ret := m.ctrl.Call(m, "Create", ctx, entry) + ret0, _ := ret[0].(error) + return ret0 +} + +// Create indicates an expected call of Create. +func (mr *MockStoreMockRecorder) Create(ctx, entry any) *gomock.Call { + mr.mock.ctrl.T.Helper() + return mr.mock.ctrl.RecordCallWithMethodType(mr.mock, "Create", reflect.TypeOf((*MockStore)(nil).Create), ctx, entry) +} + +// Delete mocks base method. +func (m *MockStore) Delete(ctx context.Context, id string) error { + m.ctrl.T.Helper() + ret := m.ctrl.Call(m, "Delete", ctx, id) + ret0, _ := ret[0].(error) + return ret0 +} + +// Delete indicates an expected call of Delete. +func (mr *MockStoreMockRecorder) Delete(ctx, id any) *gomock.Call { + mr.mock.ctrl.T.Helper() + return mr.mock.ctrl.RecordCallWithMethodType(mr.mock, "Delete", reflect.TypeOf((*MockStore)(nil).Delete), ctx, id) +} + +// Flag mocks base method. 
+func (m *MockStore) Flag(ctx context.Context, id, reason string) error { + m.ctrl.T.Helper() + ret := m.ctrl.Call(m, "Flag", ctx, id, reason) + ret0, _ := ret[0].(error) + return ret0 +} + +// Flag indicates an expected call of Flag. +func (mr *MockStoreMockRecorder) Flag(ctx, id, reason any) *gomock.Call { + mr.mock.ctrl.T.Helper() + return mr.mock.ctrl.RecordCallWithMethodType(mr.mock, "Flag", reflect.TypeOf((*MockStore)(nil).Flag), ctx, id, reason) +} + +// Get mocks base method. +func (m *MockStore) Get(ctx context.Context, id string) (memory.Entry, error) { + m.ctrl.T.Helper() + ret := m.ctrl.Call(m, "Get", ctx, id) + ret0, _ := ret[0].(memory.Entry) + ret1, _ := ret[1].(error) + return ret0, ret1 +} + +// Get indicates an expected call of Get. +func (mr *MockStoreMockRecorder) Get(ctx, id any) *gomock.Call { + mr.mock.ctrl.T.Helper() + return mr.mock.ctrl.RecordCallWithMethodType(mr.mock, "Get", reflect.TypeOf((*MockStore)(nil).Get), ctx, id) +} + +// IncrementAccess mocks base method. +func (m *MockStore) IncrementAccess(ctx context.Context, id string) error { + m.ctrl.T.Helper() + ret := m.ctrl.Call(m, "IncrementAccess", ctx, id) + ret0, _ := ret[0].(error) + return ret0 +} + +// IncrementAccess indicates an expected call of IncrementAccess. +func (mr *MockStoreMockRecorder) IncrementAccess(ctx, id any) *gomock.Call { + mr.mock.ctrl.T.Helper() + return mr.mock.ctrl.RecordCallWithMethodType(mr.mock, "IncrementAccess", reflect.TypeOf((*MockStore)(nil).IncrementAccess), ctx, id) +} + +// List mocks base method. +func (m *MockStore) List(ctx context.Context, filter memory.ListFilter) ([]memory.Entry, error) { + m.ctrl.T.Helper() + ret := m.ctrl.Call(m, "List", ctx, filter) + ret0, _ := ret[0].([]memory.Entry) + ret1, _ := ret[1].(error) + return ret0, ret1 +} + +// List indicates an expected call of List. 
+func (mr *MockStoreMockRecorder) List(ctx, filter any) *gomock.Call { + mr.mock.ctrl.T.Helper() + return mr.mock.ctrl.RecordCallWithMethodType(mr.mock, "List", reflect.TypeOf((*MockStore)(nil).List), ctx, filter) +} + +// ListActive mocks base method. +func (m *MockStore) ListActive(ctx context.Context) ([]memory.Entry, error) { + m.ctrl.T.Helper() + ret := m.ctrl.Call(m, "ListActive", ctx) + ret0, _ := ret[0].([]memory.Entry) + ret1, _ := ret[1].(error) + return ret0, ret1 +} + +// ListActive indicates an expected call of ListActive. +func (mr *MockStoreMockRecorder) ListActive(ctx any) *gomock.Call { + mr.mock.ctrl.T.Helper() + return mr.mock.ctrl.RecordCallWithMethodType(mr.mock, "ListActive", reflect.TypeOf((*MockStore)(nil).ListActive), ctx) +} + +// ListExpired mocks base method. +func (m *MockStore) ListExpired(ctx context.Context) ([]memory.Entry, error) { + m.ctrl.T.Helper() + ret := m.ctrl.Call(m, "ListExpired", ctx) + ret0, _ := ret[0].([]memory.Entry) + ret1, _ := ret[1].(error) + return ret0, ret1 +} + +// ListExpired indicates an expected call of ListExpired. +func (mr *MockStoreMockRecorder) ListExpired(ctx any) *gomock.Call { + mr.mock.ctrl.T.Helper() + return mr.mock.ctrl.RecordCallWithMethodType(mr.mock, "ListExpired", reflect.TypeOf((*MockStore)(nil).ListExpired), ctx) +} + +// Unflag mocks base method. +func (m *MockStore) Unflag(ctx context.Context, id string) error { + m.ctrl.T.Helper() + ret := m.ctrl.Call(m, "Unflag", ctx, id) + ret0, _ := ret[0].(error) + return ret0 +} + +// Unflag indicates an expected call of Unflag. +func (mr *MockStoreMockRecorder) Unflag(ctx, id any) *gomock.Call { + mr.mock.ctrl.T.Helper() + return mr.mock.ctrl.RecordCallWithMethodType(mr.mock, "Unflag", reflect.TypeOf((*MockStore)(nil).Unflag), ctx, id) +} + +// Update mocks base method. 
+func (m *MockStore) Update(ctx context.Context, id, content string, author memory.AuthorType, correctionNote string) error { + m.ctrl.T.Helper() + ret := m.ctrl.Call(m, "Update", ctx, id, content, author, correctionNote) + ret0, _ := ret[0].(error) + return ret0 +} + +// Update indicates an expected call of Update. +func (mr *MockStoreMockRecorder) Update(ctx, id, content, author, correctionNote any) *gomock.Call { + mr.mock.ctrl.T.Helper() + return mr.mock.ctrl.RecordCallWithMethodType(mr.mock, "Update", reflect.TypeOf((*MockStore)(nil).Update), ctx, id, content, author, correctionNote) +} + +// UpdateScores mocks base method. +func (m *MockStore) UpdateScores(ctx context.Context, id string, trustScore, stalenessScore float32) error { + m.ctrl.T.Helper() + ret := m.ctrl.Call(m, "UpdateScores", ctx, id, trustScore, stalenessScore) + ret0, _ := ret[0].(error) + return ret0 +} + +// UpdateScores indicates an expected call of UpdateScores. +func (mr *MockStoreMockRecorder) UpdateScores(ctx, id, trustScore, stalenessScore any) *gomock.Call { + mr.mock.ctrl.T.Helper() + return mr.mock.ctrl.RecordCallWithMethodType(mr.mock, "UpdateScores", reflect.TypeOf((*MockStore)(nil).UpdateScores), ctx, id, trustScore, stalenessScore) +} diff --git a/pkg/memory/mocks/mock_vector.go b/pkg/memory/mocks/mock_vector.go new file mode 100644 index 0000000000..0df2f3d80c --- /dev/null +++ b/pkg/memory/mocks/mock_vector.go @@ -0,0 +1,85 @@ +// Code generated by MockGen. DO NOT EDIT. +// Source: github.com/stacklok/toolhive/pkg/memory (interfaces: VectorStore) +// +// Generated by this command: +// +// mockgen -destination mocks/mock_vector.go -package mocks github.com/stacklok/toolhive/pkg/memory VectorStore +// + +// Package mocks is a generated GoMock package. +package mocks + +import ( + context "context" + reflect "reflect" + + memory "github.com/stacklok/toolhive/pkg/memory" + gomock "go.uber.org/mock/gomock" +) + +// MockVectorStore is a mock of VectorStore interface. 
+type MockVectorStore struct { + ctrl *gomock.Controller + recorder *MockVectorStoreMockRecorder + isgomock struct{} +} + +// MockVectorStoreMockRecorder is the mock recorder for MockVectorStore. +type MockVectorStoreMockRecorder struct { + mock *MockVectorStore +} + +// NewMockVectorStore creates a new mock instance. +func NewMockVectorStore(ctrl *gomock.Controller) *MockVectorStore { + mock := &MockVectorStore{ctrl: ctrl} + mock.recorder = &MockVectorStoreMockRecorder{mock} + return mock +} + +// EXPECT returns an object that allows the caller to indicate expected use. +func (m *MockVectorStore) EXPECT() *MockVectorStoreMockRecorder { + return m.recorder +} + +// Delete mocks base method. +func (m *MockVectorStore) Delete(ctx context.Context, id string) error { + m.ctrl.T.Helper() + ret := m.ctrl.Call(m, "Delete", ctx, id) + ret0, _ := ret[0].(error) + return ret0 +} + +// Delete indicates an expected call of Delete. +func (mr *MockVectorStoreMockRecorder) Delete(ctx, id any) *gomock.Call { + mr.mock.ctrl.T.Helper() + return mr.mock.ctrl.RecordCallWithMethodType(mr.mock, "Delete", reflect.TypeOf((*MockVectorStore)(nil).Delete), ctx, id) +} + +// Search mocks base method. +func (m *MockVectorStore) Search(ctx context.Context, query []float32, topK int, filter memory.VectorFilter) ([]memory.ScoredID, error) { + m.ctrl.T.Helper() + ret := m.ctrl.Call(m, "Search", ctx, query, topK, filter) + ret0, _ := ret[0].([]memory.ScoredID) + ret1, _ := ret[1].(error) + return ret0, ret1 +} + +// Search indicates an expected call of Search. +func (mr *MockVectorStoreMockRecorder) Search(ctx, query, topK, filter any) *gomock.Call { + mr.mock.ctrl.T.Helper() + return mr.mock.ctrl.RecordCallWithMethodType(mr.mock, "Search", reflect.TypeOf((*MockVectorStore)(nil).Search), ctx, query, topK, filter) +} + +// Upsert mocks base method. 
+func (m *MockVectorStore) Upsert(ctx context.Context, id string, embedding []float32) error { + m.ctrl.T.Helper() + ret := m.ctrl.Call(m, "Upsert", ctx, id, embedding) + ret0, _ := ret[0].(error) + return ret0 +} + +// Upsert indicates an expected call of Upsert. +func (mr *MockVectorStoreMockRecorder) Upsert(ctx, id, embedding any) *gomock.Call { + mr.mock.ctrl.T.Helper() + return mr.mock.ctrl.RecordCallWithMethodType(mr.mock, "Upsert", reflect.TypeOf((*MockVectorStore)(nil).Upsert), ctx, id, embedding) +} diff --git a/pkg/memory/scoring.go b/pkg/memory/scoring.go new file mode 100644 index 0000000000..93997aff87 --- /dev/null +++ b/pkg/memory/scoring.go @@ -0,0 +1,70 @@ +// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc. +// SPDX-License-Identifier: Apache-2.0 + +package memory + +import ( + "math" + "time" +) + +const ( + authorWeightHuman = 1.0 + authorWeightAgent = 0.7 + halfLifeDays = 180.0 + maxCorrectionPenalty = 0.30 + correctionPenaltyPerCorrection = 0.05 + flagTrustMultiplier = 0.5 + maxStalenessAccessDays = 90.0 + flagStalenessBonus = 0.3 + correctionStalenessPerItem = 0.1 + maxCorrectionStaleness = 0.3 +) + +// ComputeTrustScore returns a value in [0,1] representing how trustworthy +// this memory entry is. Higher = more trustworthy. 
+// +// Formula: author_weight × age_decay × (1 - correction_penalty) × flag_multiplier +func ComputeTrustScore(entry Entry) float32 { + weight := authorWeightAgent + if entry.Author == AuthorHuman { + weight = authorWeightHuman + } + + ageInDays := time.Since(entry.CreatedAt).Hours() / 24 + decay := math.Exp(-ageInDays * math.Log(2) / halfLifeDays) + + corrections := len(entry.History) + correctionPenalty := math.Min(float64(corrections)*correctionPenaltyPerCorrection, maxCorrectionPenalty) + + flagMultiplier := 1.0 + if entry.FlaggedAt != nil { + flagMultiplier = flagTrustMultiplier + } + + score := weight * decay * (1 - correctionPenalty) * flagMultiplier + return float32(math.Max(0, math.Min(1, score))) +} + +// ComputeStalenessScore returns a value in [0,1] representing how stale +// this memory entry is. Higher = more stale (more likely to need review). +// +// Formula: access_age_normalized + flag_bonus + correction_bonus +func ComputeStalenessScore(entry Entry) float32 { + lastAccess := entry.LastAccessedAt + if lastAccess.IsZero() { + lastAccess = entry.CreatedAt + } + daysSinceAccess := time.Since(lastAccess).Hours() / 24 + base := math.Min(daysSinceAccess/maxStalenessAccessDays, 1.0) + + flagBonus := 0.0 + if entry.FlaggedAt != nil { + flagBonus = flagStalenessBonus + } + + corrections := len(entry.History) + correctionBonus := math.Min(float64(corrections)*correctionStalenessPerItem, maxCorrectionStaleness) + + return float32(math.Min(1.0, base+flagBonus+correctionBonus)) +} diff --git a/pkg/memory/scoring_test.go b/pkg/memory/scoring_test.go new file mode 100644 index 0000000000..e8a5da982e --- /dev/null +++ b/pkg/memory/scoring_test.go @@ -0,0 +1,138 @@ +// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc. 
+// SPDX-License-Identifier: Apache-2.0 + +package memory_test + +import ( + "testing" + "time" + + "github.com/stretchr/testify/require" + + "github.com/stacklok/toolhive/pkg/memory" +) + +func TestComputeTrustScore(t *testing.T) { + t.Parallel() + now := time.Now() + + tests := []struct { + name string + entry memory.Entry + wantMin float32 + wantMax float32 + }{ + { + name: "fresh human entry has high trust", + entry: memory.Entry{ + Author: memory.AuthorHuman, + CreatedAt: now, + }, + wantMin: 0.95, + wantMax: 1.0, + }, + { + name: "fresh agent entry has lower trust than human", + entry: memory.Entry{ + Author: memory.AuthorAgent, + CreatedAt: now, + }, + wantMin: 0.65, + wantMax: 0.75, + }, + { + name: "flagged entry has halved trust", + entry: func() memory.Entry { + ft := now + return memory.Entry{ + Author: memory.AuthorHuman, + CreatedAt: now, + FlaggedAt: &ft, + } + }(), + wantMin: 0.45, + wantMax: 0.55, + }, + { + name: "two corrections reduce trust", + entry: memory.Entry{ + Author: memory.AuthorHuman, + CreatedAt: now, + History: []memory.Revision{{}, {}}, + }, + wantMin: 0.85, + wantMax: 0.95, + }, + { + name: "old entry has decayed trust", + entry: memory.Entry{ + Author: memory.AuthorHuman, + CreatedAt: now.AddDate(0, 0, -180), // half-life + }, + wantMin: 0.45, + wantMax: 0.55, + }, + } + + for _, tc := range tests { + t.Run(tc.name, func(t *testing.T) { + t.Parallel() + score := memory.ComputeTrustScore(tc.entry) + require.GreaterOrEqual(t, score, tc.wantMin, "trust score too low") + require.LessOrEqual(t, score, tc.wantMax, "trust score too high") + }) + } +} + +func TestComputeStalenessScore(t *testing.T) { + t.Parallel() + now := time.Now() + + tests := []struct { + name string + entry memory.Entry + wantMin float32 + wantMax float32 + }{ + { + name: "recently accessed entry is fresh", + entry: memory.Entry{ + CreatedAt: now, + LastAccessedAt: now, + }, + wantMin: 0.0, + wantMax: 0.05, + }, + { + name: "entry not accessed for 90 days is stale", 
+ entry: memory.Entry{ + CreatedAt: now.AddDate(0, 0, -90), + LastAccessedAt: now.AddDate(0, 0, -90), + }, + wantMin: 0.95, + wantMax: 1.0, + }, + { + name: "flagged entry adds staleness bonus", + entry: func() memory.Entry { + ft := now + return memory.Entry{ + CreatedAt: now, + LastAccessedAt: now, + FlaggedAt: &ft, + } + }(), + wantMin: 0.28, + wantMax: 0.32, + }, + } + + for _, tc := range tests { + t.Run(tc.name, func(t *testing.T) { + t.Parallel() + score := memory.ComputeStalenessScore(tc.entry) + require.GreaterOrEqual(t, score, tc.wantMin) + require.LessOrEqual(t, score, tc.wantMax) + }) + } +} diff --git a/pkg/memory/service.go b/pkg/memory/service.go new file mode 100644 index 0000000000..7db0e45f82 --- /dev/null +++ b/pkg/memory/service.go @@ -0,0 +1,205 @@ +// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc. +// SPDX-License-Identifier: Apache-2.0 + +package memory + +import ( + "context" + "fmt" + "sort" + "time" + + "github.com/google/uuid" + "go.uber.org/zap" +) + +const ( + conflictSimilarityThreshold = float32(0.85) + defaultConflictTopK = 5 + // stalenessSearchPenaltyWeight controls how much staleness reduces ranking score. + stalenessSearchPenaltyWeight = float32(0.3) +) + +// Service orchestrates Store, VectorStore, and Embedder to provide +// the full memory lifecycle including conflict detection and scoring. +type Service struct { + store Store + vectors VectorStore + embedder Embedder + log *zap.Logger +} + +// NewService constructs a Service. All dependencies are required. +// +// The Store provides durable persistence for memory entries. +// The VectorStore enables semantic similarity search over entry embeddings. +// The Embedder converts text to vectors; the caller is responsible for +// ensuring the same Embedder is used consistently — switching embedders +// will invalidate stored vectors. 
+func NewService(store Store, vectors VectorStore, embedder Embedder, log *zap.Logger) (*Service, error) { + if store == nil { + return nil, fmt.Errorf("store is required") + } + if vectors == nil { + return nil, fmt.Errorf("vector store is required") + } + if embedder == nil { + return nil, fmt.Errorf("embedder is required") + } + if log == nil { + return nil, fmt.Errorf("logger is required") + } + return &Service{store: store, vectors: vectors, embedder: embedder, log: log}, nil +} + +// RememberInput is the input to Service.Remember. +type RememberInput struct { + Content string + Type Type + Tags []string + Author AuthorType + AgentID string + SessionID string + Source SourceType + SkillRef string + TTLDays *int + // Force bypasses conflict detection and writes unconditionally. + Force bool +} + +// RememberResult is returned by Service.Remember. +// If Conflicts is non-empty, MemoryID is empty and the write was not performed. +type RememberResult struct { + MemoryID string + Conflicts []ConflictResult +} + +// Remember embeds content, checks for conflicts, and writes the entry if none found. +// When Force is true the conflict check is skipped entirely. 
+func (s *Service) Remember(ctx context.Context, in RememberInput) (*RememberResult, error) { + embedding, err := s.embedder.Embed(ctx, in.Content) + if err != nil { + return nil, fmt.Errorf("embedding content: %w", err) + } + + if !in.Force { + conflicts, err := s.detectConflicts(ctx, embedding, in.Type) + if err != nil { + return nil, fmt.Errorf("detecting conflicts: %w", err) + } + if len(conflicts) > 0 { + return &RememberResult{Conflicts: conflicts}, nil + } + } + + id := "mem_" + uuid.New().String() + now := time.Now().UTC() + entry := Entry{ + ID: id, + Type: in.Type, + Content: in.Content, + Tags: in.Tags, + Author: in.Author, + AgentID: in.AgentID, + SessionID: in.SessionID, + Source: sourceOrDefault(in.Source), + SkillRef: in.SkillRef, + Status: EntryStatusActive, + TTLDays: in.TTLDays, + CreatedAt: now, + UpdatedAt: now, + } + if in.TTLDays != nil { + t := now.AddDate(0, 0, *in.TTLDays) + entry.ExpiresAt = &t + } + entry.TrustScore = ComputeTrustScore(entry) + entry.StalenessScore = ComputeStalenessScore(entry) + + if err := s.store.Create(ctx, entry); err != nil { + return nil, fmt.Errorf("creating entry: %w", err) + } + if err := s.vectors.Upsert(ctx, id, embedding); err != nil { + // Best-effort rollback: remove the orphaned store entry. + _ = s.store.Delete(ctx, id) + return nil, fmt.Errorf("upserting vector: %w", err) + } + + return &RememberResult{MemoryID: id}, nil +} + +// Search embeds the query, searches the vector store, fetches entries, and +// increments access counts. 
+func (s *Service) Search(ctx context.Context, query string, memType *Type, topK int) ([]ScoredEntry, error) { + if topK <= 0 { + topK = 10 + } + embedding, err := s.embedder.Embed(ctx, query) + if err != nil { + return nil, fmt.Errorf("embedding query: %w", err) + } + + active := EntryStatusActive + ids, err := s.vectors.Search(ctx, embedding, topK, VectorFilter{Type: memType, Status: &active}) + if err != nil { + return nil, fmt.Errorf("vector search: %w", err) + } + + var results []ScoredEntry + for _, scored := range ids { + entry, err := s.store.Get(ctx, scored.ID) + if err != nil { + s.log.Warn("skipping missing entry", zap.String("id", scored.ID), zap.Error(err)) + continue + } + // Increment access count; failure is non-fatal. + _ = s.store.IncrementAccess(ctx, scored.ID) + // Composite score: boost by trust, penalise by staleness. + composite := scored.Similarity * entry.TrustScore * (1 - stalenessSearchPenaltyWeight*entry.StalenessScore) + results = append(results, ScoredEntry{Entry: entry, Similarity: composite}) + } + sort.Slice(results, func(i, j int) bool { + return results[i].Similarity > results[j].Similarity + }) + return results, nil +} + +// detectConflicts returns any existing entries whose embedding similarity to +// the candidate exceeds conflictSimilarityThreshold. +func (s *Service) detectConflicts(ctx context.Context, embedding []float32, memType Type) ([]ConflictResult, error) { + active := EntryStatusActive + candidates, err := s.vectors.Search(ctx, embedding, defaultConflictTopK, VectorFilter{ + Type: &memType, + Status: &active, + }) + if err != nil { + return nil, err + } + + var conflicts []ConflictResult + for _, c := range candidates { + if c.Similarity < conflictSimilarityThreshold { + continue + } + entry, err := s.store.Get(ctx, c.ID) + if err != nil { + // Skip entries that can't be fetched; they may have been deleted concurrently. 
+ s.log.Warn("skipping conflict candidate", zap.String("id", c.ID), zap.Error(err)) + continue + } + conflicts = append(conflicts, ConflictResult{ + ID: entry.ID, + Content: entry.Content, + Similarity: c.Similarity, + TrustScore: entry.TrustScore, + }) + } + return conflicts, nil +} + +func sourceOrDefault(s SourceType) SourceType { + if s == "" { + return SourceMemory + } + return s +} diff --git a/pkg/memory/service_test.go b/pkg/memory/service_test.go new file mode 100644 index 0000000000..8e0d721acc --- /dev/null +++ b/pkg/memory/service_test.go @@ -0,0 +1,153 @@ +// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc. +// SPDX-License-Identifier: Apache-2.0 + +package memory_test + +import ( + "context" + "testing" + "time" + + "github.com/stretchr/testify/require" + "go.uber.org/mock/gomock" + "go.uber.org/zap/zaptest" + + "github.com/stacklok/toolhive/pkg/memory" + "github.com/stacklok/toolhive/pkg/memory/mocks" +) + +func TestService_Remember_NoConflict(t *testing.T) { + t.Parallel() + ctrl := gomock.NewController(t) + store := mocks.NewMockStore(ctrl) + vectors := mocks.NewMockVectorStore(ctrl) + embedder := mocks.NewMockEmbedder(ctrl) + + emb := []float32{1, 0, 0} + embedder.EXPECT().Embed(gomock.Any(), "test fact").Return(emb, nil) + active := memory.EntryStatusActive + vectors.EXPECT().Search(gomock.Any(), emb, 5, memory.VectorFilter{ + Type: ptrOf(memory.TypeSemantic), + Status: &active, + }).Return(nil, nil) + store.EXPECT().Create(gomock.Any(), gomock.Any()).Return(nil) + vectors.EXPECT().Upsert(gomock.Any(), gomock.Any(), emb).Return(nil) + + svc, err := memory.NewService(store, vectors, embedder, zaptest.NewLogger(t)) + require.NoError(t, err) + + result, err := svc.Remember(context.Background(), memory.RememberInput{ + Content: "test fact", + Type: memory.TypeSemantic, + Author: memory.AuthorHuman, + }) + require.NoError(t, err) + require.NotEmpty(t, result.MemoryID) + require.Empty(t, result.Conflicts) +} + +func 
TestService_Remember_ConflictDetected(t *testing.T) { + t.Parallel() + ctrl := gomock.NewController(t) + store := mocks.NewMockStore(ctrl) + vectors := mocks.NewMockVectorStore(ctrl) + embedder := mocks.NewMockEmbedder(ctrl) + + emb := []float32{1, 0, 0} + embedder.EXPECT().Embed(gomock.Any(), "conflicting fact").Return(emb, nil) + active := memory.EntryStatusActive + vectors.EXPECT().Search(gomock.Any(), emb, 5, memory.VectorFilter{ + Type: ptrOf(memory.TypeSemantic), + Status: &active, + }).Return([]memory.ScoredID{{ID: "mem_existing", Similarity: 0.92}}, nil) + store.EXPECT().Get(gomock.Any(), "mem_existing").Return(memory.Entry{ + ID: "mem_existing", + Content: "existing fact", + }, nil) + + svc, err := memory.NewService(store, vectors, embedder, zaptest.NewLogger(t)) + require.NoError(t, err) + + result, err := svc.Remember(context.Background(), memory.RememberInput{ + Content: "conflicting fact", + Type: memory.TypeSemantic, + Author: memory.AuthorAgent, + }) + require.NoError(t, err) + require.Empty(t, result.MemoryID) + require.Len(t, result.Conflicts, 1) + require.Equal(t, "mem_existing", result.Conflicts[0].ID) +} + +func TestService_Remember_Force(t *testing.T) { + t.Parallel() + ctrl := gomock.NewController(t) + store := mocks.NewMockStore(ctrl) + vectors := mocks.NewMockVectorStore(ctrl) + embedder := mocks.NewMockEmbedder(ctrl) + + emb := []float32{1, 0, 0} + embedder.EXPECT().Embed(gomock.Any(), "forced fact").Return(emb, nil) + store.EXPECT().Create(gomock.Any(), gomock.Any()).Return(nil) + vectors.EXPECT().Upsert(gomock.Any(), gomock.Any(), emb).Return(nil) + + svc, err := memory.NewService(store, vectors, embedder, zaptest.NewLogger(t)) + require.NoError(t, err) + + result, err := svc.Remember(context.Background(), memory.RememberInput{ + Content: "forced fact", + Type: memory.TypeSemantic, + Author: memory.AuthorHuman, + Force: true, + }) + require.NoError(t, err) + require.NotEmpty(t, result.MemoryID) +} + +func 
TestService_Search_CompositeScoring(t *testing.T) { + t.Parallel() + ctrl := gomock.NewController(t) + store := mocks.NewMockStore(ctrl) + vectors := mocks.NewMockVectorStore(ctrl) + embedder := mocks.NewMockEmbedder(ctrl) + + emb := []float32{1, 0, 0} + embedder.EXPECT().Embed(gomock.Any(), "auth endpoint").Return(emb, nil) + + active := memory.EntryStatusActive + // Two results: high raw similarity but stale/flagged vs lower similarity but fresh+trusted. + vectors.EXPECT().Search(gomock.Any(), emb, 10, memory.VectorFilter{Status: &active}). + Return([]memory.ScoredID{ + {ID: "stale_high", Similarity: 0.95}, + {ID: "fresh_low", Similarity: 0.80}, + }, nil) + + now := time.Now() + flagTime := now.Add(-24 * time.Hour) + + store.EXPECT().Get(gomock.Any(), "stale_high").Return(memory.Entry{ + ID: "stale_high", Author: memory.AuthorAgent, + TrustScore: 0.5, StalenessScore: 0.8, CreatedAt: now, FlaggedAt: &flagTime, + }, nil) + store.EXPECT().IncrementAccess(gomock.Any(), "stale_high").Return(nil) + + store.EXPECT().Get(gomock.Any(), "fresh_low").Return(memory.Entry{ + ID: "fresh_low", Author: memory.AuthorHuman, + TrustScore: 1.0, StalenessScore: 0.0, CreatedAt: now, + }, nil) + store.EXPECT().IncrementAccess(gomock.Any(), "fresh_low").Return(nil) + + svc, err := memory.NewService(store, vectors, embedder, zaptest.NewLogger(t)) + require.NoError(t, err) + + results, err := svc.Search(context.Background(), "auth endpoint", nil, 0) + require.NoError(t, err) + require.Len(t, results, 2) + + // fresh_low (composite ≈ 0.80) should rank above stale_high (0.95 × 0.5 × (1-0.3×0.8) ≈ 0.361) + require.Equal(t, "fresh_low", results[0].Entry.ID) + require.Equal(t, "stale_high", results[1].Entry.ID) + require.Greater(t, results[0].Similarity, results[1].Similarity) +} + +func ptrOf[T any](v T) *T { return &v } diff --git a/pkg/memory/sqlite/db.go b/pkg/memory/sqlite/db.go new file mode 100644 index 0000000000..50a56d0ece --- /dev/null +++ b/pkg/memory/sqlite/db.go @@ -0,0 +1,106 @@ 
+// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc. +// SPDX-License-Identifier: Apache-2.0 + +// Package sqlite provides SQLite-backed implementations of the memory.Store +// and memory.VectorStore interfaces. +package sqlite + +import ( + "context" + "database/sql" + "embed" + "errors" + "fmt" + "io/fs" + "os" + "path/filepath" + + "github.com/pressly/goose/v3" + _ "modernc.org/sqlite" // SQLite driver +) + +//go:embed migrations/*.sql +var migrations embed.FS + +// DB wraps a *sql.DB connection for the memory SQLite database. +type DB struct { + db *sql.DB +} + +// Open opens (or creates) the memory SQLite database at path. +func Open(ctx context.Context, path string) (_ *DB, err error) { + if err := os.MkdirAll(filepath.Dir(path), 0750); err != nil { + return nil, fmt.Errorf("creating database directory: %w", err) + } + + dsn := fmt.Sprintf("file:%s?_txlock=immediate", path) + sqlDB, err := sql.Open("sqlite", dsn) + if err != nil { + return nil, fmt.Errorf("opening database: %w", err) + } + + success := false + defer func() { + if !success { + if closeErr := sqlDB.Close(); closeErr != nil { + err = errors.Join(err, fmt.Errorf("closing database after failure: %w", closeErr)) + } + } + }() + + sqlDB.SetMaxOpenConns(1) + sqlDB.SetMaxIdleConns(1) + + if err = applyPragmas(sqlDB); err != nil { + return nil, err + } + + if err = runMigrations(ctx, sqlDB); err != nil { + return nil, err + } + + if err = sqlDB.PingContext(ctx); err != nil { + return nil, fmt.Errorf("verifying connection: %w", err) + } + + success = true + return &DB{db: sqlDB}, nil +} + +// Close closes the underlying database connection. +func (d *DB) Close() error { return d.db.Close() } + +// DB returns the underlying *sql.DB. 
+func (d *DB) DB() *sql.DB { return d.db } + +func applyPragmas(db *sql.DB) error { + for _, p := range []string{ + "PRAGMA journal_mode=WAL", + "PRAGMA busy_timeout=5000", + "PRAGMA synchronous=NORMAL", + "PRAGMA foreign_keys=ON", + "PRAGMA cache_size=-2000", + } { + if _, err := db.Exec(p); err != nil { + return fmt.Errorf("applying pragma %q: %w", p, err) + } + } + return nil +} + +func runMigrations(ctx context.Context, db *sql.DB) error { + migrationsFS, err := fs.Sub(migrations, "migrations") + if err != nil { + return fmt.Errorf("creating migrations sub-filesystem: %w", err) + } + provider, err := goose.NewProvider(goose.DialectSQLite3, db, migrationsFS, + goose.WithAllowOutofOrder(false), + ) + if err != nil { + return fmt.Errorf("creating goose provider: %w", err) + } + if _, err := provider.Up(ctx); err != nil { + return fmt.Errorf("running migrations: %w", err) + } + return nil +} diff --git a/pkg/memory/sqlite/migrations/001_initial.sql b/pkg/memory/sqlite/migrations/001_initial.sql new file mode 100644 index 0000000000..717f8061d9 --- /dev/null +++ b/pkg/memory/sqlite/migrations/001_initial.sql @@ -0,0 +1,60 @@ +-- +goose Up + +CREATE TABLE IF NOT EXISTS memory_entries ( + id TEXT PRIMARY KEY, + type TEXT NOT NULL CHECK (type IN ('semantic','procedural')), + content TEXT NOT NULL, + tags TEXT NOT NULL DEFAULT '[]', -- JSON array + author TEXT NOT NULL CHECK (author IN ('human','agent')), + agent_id TEXT NOT NULL DEFAULT '', + session_id TEXT NOT NULL DEFAULT '', + source TEXT NOT NULL CHECK (source IN ('memory','skill')), + skill_ref TEXT NOT NULL DEFAULT '', + status TEXT NOT NULL DEFAULT 'active' + CHECK (status IN ('active','flagged','expired','archived')), + trust_score REAL NOT NULL DEFAULT 0, + staleness_score REAL NOT NULL DEFAULT 0, + access_count INTEGER NOT NULL DEFAULT 0, + last_accessed_at TEXT, + flagged_at TEXT, + flag_reason TEXT NOT NULL DEFAULT '', + ttl_days INTEGER, + expires_at TEXT, + archived_at TEXT, + consolidated_into TEXT NOT 
NULL DEFAULT '', + crystallized_into TEXT NOT NULL DEFAULT '', + created_at TEXT NOT NULL, + updated_at TEXT NOT NULL +); + +CREATE TABLE IF NOT EXISTS memory_revisions ( + id INTEGER PRIMARY KEY AUTOINCREMENT, + entry_id TEXT NOT NULL REFERENCES memory_entries(id) ON DELETE CASCADE, + content TEXT NOT NULL, + author TEXT NOT NULL, + correction_note TEXT NOT NULL DEFAULT '', + created_at TEXT NOT NULL +); + +-- Embeddings stored as a JSON array of float32 values. +-- Queries load all vectors for a type+status combination and compute +-- cosine similarity in Go. Switch to an external VectorStore provider +-- for datasets > 100K entries. +CREATE TABLE IF NOT EXISTS memory_embeddings ( + entry_id TEXT PRIMARY KEY REFERENCES memory_entries(id) ON DELETE CASCADE, + embedding TEXT NOT NULL -- JSON []float32 +); + +CREATE INDEX IF NOT EXISTS idx_memory_entries_type_status + ON memory_entries(type, status); + +CREATE INDEX IF NOT EXISTS idx_memory_entries_expires_at + ON memory_entries(expires_at) WHERE expires_at IS NOT NULL; + +-- +goose Down + +DROP INDEX IF EXISTS idx_memory_entries_expires_at; +DROP INDEX IF EXISTS idx_memory_entries_type_status; +DROP TABLE IF EXISTS memory_embeddings; +DROP TABLE IF EXISTS memory_revisions; +DROP TABLE IF EXISTS memory_entries; diff --git a/pkg/memory/sqlite/migrations/002_add_episodic_type.sql b/pkg/memory/sqlite/migrations/002_add_episodic_type.sql new file mode 100644 index 0000000000..d614ce3d39 --- /dev/null +++ b/pkg/memory/sqlite/migrations/002_add_episodic_type.sql @@ -0,0 +1,83 @@ +-- +goose Up + +-- SQLite does not support ALTER COLUMN, so we recreate the table with the +-- updated CHECK constraint to include the 'episodic' memory type. 

-- NOTE(review): this recreate runs with PRAGMA foreign_keys=ON (set by
-- applyPragmas) and inside goose's migration transaction. With foreign keys
-- enabled, SQLite's DROP TABLE performs an implicit DELETE before dropping,
-- which fires the ON DELETE CASCADE actions on memory_revisions and
-- memory_embeddings — silently wiping all revision history and embeddings.
-- PRAGMA foreign_keys is a no-op inside a transaction, so it cannot be
-- toggled here; the fix is to mark this file `-- +goose NO TRANSACTION` and
-- bracket the recreate with PRAGMA foreign_keys=OFF / ON, per SQLite's
-- documented table-recreate (ALTER TABLE) procedure.
-- TODO: confirm against the SQLite DROP TABLE docs and fix before shipping.

CREATE TABLE IF NOT EXISTS memory_entries_new (
    id TEXT PRIMARY KEY,
    type TEXT NOT NULL CHECK (type IN ('semantic','procedural','episodic')),
    content TEXT NOT NULL,
    tags TEXT NOT NULL DEFAULT '[]',
    author TEXT NOT NULL CHECK (author IN ('human','agent')),
    agent_id TEXT NOT NULL DEFAULT '',
    session_id TEXT NOT NULL DEFAULT '',
    source TEXT NOT NULL CHECK (source IN ('memory','skill')),
    skill_ref TEXT NOT NULL DEFAULT '',
    status TEXT NOT NULL DEFAULT 'active'
        CHECK (status IN ('active','flagged','expired','archived')),
    trust_score REAL NOT NULL DEFAULT 0,
    staleness_score REAL NOT NULL DEFAULT 0,
    access_count INTEGER NOT NULL DEFAULT 0,
    last_accessed_at TEXT,
    flagged_at TEXT,
    flag_reason TEXT NOT NULL DEFAULT '',
    ttl_days INTEGER,
    expires_at TEXT,
    archived_at TEXT,
    consolidated_into TEXT NOT NULL DEFAULT '',
    crystallized_into TEXT NOT NULL DEFAULT '',
    created_at TEXT NOT NULL,
    updated_at TEXT NOT NULL
);

-- Column-order-dependent copy: memory_entries_new declares columns in the
-- exact order of the 001 schema, so SELECT * is safe here.
INSERT INTO memory_entries_new SELECT * FROM memory_entries;
DROP TABLE memory_entries;
ALTER TABLE memory_entries_new RENAME TO memory_entries;

CREATE INDEX IF NOT EXISTS idx_memory_entries_type_status
    ON memory_entries(type, status);

CREATE INDEX IF NOT EXISTS idx_memory_entries_expires_at
    ON memory_entries(expires_at) WHERE expires_at IS NOT NULL;

-- +goose Down

-- Revert: drop episodic rows then recreate the narrower constraint.
+DELETE FROM memory_entries WHERE type = 'episodic'; + +CREATE TABLE IF NOT EXISTS memory_entries_old ( + id TEXT PRIMARY KEY, + type TEXT NOT NULL CHECK (type IN ('semantic','procedural')), + content TEXT NOT NULL, + tags TEXT NOT NULL DEFAULT '[]', + author TEXT NOT NULL CHECK (author IN ('human','agent')), + agent_id TEXT NOT NULL DEFAULT '', + session_id TEXT NOT NULL DEFAULT '', + source TEXT NOT NULL CHECK (source IN ('memory','skill')), + skill_ref TEXT NOT NULL DEFAULT '', + status TEXT NOT NULL DEFAULT 'active' + CHECK (status IN ('active','flagged','expired','archived')), + trust_score REAL NOT NULL DEFAULT 0, + staleness_score REAL NOT NULL DEFAULT 0, + access_count INTEGER NOT NULL DEFAULT 0, + last_accessed_at TEXT, + flagged_at TEXT, + flag_reason TEXT NOT NULL DEFAULT '', + ttl_days INTEGER, + expires_at TEXT, + archived_at TEXT, + consolidated_into TEXT NOT NULL DEFAULT '', + crystallized_into TEXT NOT NULL DEFAULT '', + created_at TEXT NOT NULL, + updated_at TEXT NOT NULL +); + +INSERT INTO memory_entries_old SELECT * FROM memory_entries; +DROP TABLE memory_entries; +ALTER TABLE memory_entries_old RENAME TO memory_entries; + +CREATE INDEX IF NOT EXISTS idx_memory_entries_type_status + ON memory_entries(type, status); + +CREATE INDEX IF NOT EXISTS idx_memory_entries_expires_at + ON memory_entries(expires_at) WHERE expires_at IS NOT NULL; diff --git a/pkg/memory/sqlite/store.go b/pkg/memory/sqlite/store.go new file mode 100644 index 0000000000..80fe0c9eb0 --- /dev/null +++ b/pkg/memory/sqlite/store.go @@ -0,0 +1,364 @@ +// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc. +// SPDX-License-Identifier: Apache-2.0 + +package sqlite + +import ( + "context" + "database/sql" + "encoding/json" + "errors" + "fmt" + "time" + + "github.com/stacklok/toolhive/pkg/memory" +) + +// Store implements memory.Store using SQLite. +type Store struct { + db *sql.DB +} + +// NewStore creates a new SQLite-backed Store. 
+func NewStore(wrapper *DB) *Store { + return &Store{db: wrapper.DB()} +} + +var _ memory.Store = (*Store)(nil) + +// Create inserts a new memory entry. +func (s *Store) Create(ctx context.Context, e memory.Entry) error { + tags, err := json.Marshal(e.Tags) + if err != nil { + return fmt.Errorf("marshalling tags: %w", err) + } + + _, err = s.db.ExecContext(ctx, ` + INSERT INTO memory_entries + (id, type, content, tags, author, agent_id, session_id, source, skill_ref, + status, trust_score, staleness_score, access_count, last_accessed_at, + ttl_days, expires_at, created_at, updated_at) + VALUES (?,?,?,?,?,?,?,?,?,?,?,?,?,?,?,?,?,?)`, + e.ID, string(e.Type), e.Content, string(tags), + string(e.Author), e.AgentID, e.SessionID, string(e.Source), e.SkillRef, + string(e.Status), e.TrustScore, e.StalenessScore, e.AccessCount, + nullableTime(e.LastAccessedAt), + e.TTLDays, nullableTimePtr(e.ExpiresAt), + e.CreatedAt.UTC().Format(time.RFC3339Nano), + e.UpdatedAt.UTC().Format(time.RFC3339Nano), + ) + return err +} + +// Get retrieves a single entry by ID, including its revision history. +func (s *Store) Get(ctx context.Context, id string) (memory.Entry, error) { + row := s.db.QueryRowContext(ctx, ` + SELECT id, type, content, tags, author, agent_id, session_id, source, skill_ref, + status, trust_score, staleness_score, access_count, last_accessed_at, + flagged_at, flag_reason, ttl_days, expires_at, archived_at, + consolidated_into, crystallized_into, created_at, updated_at + FROM memory_entries WHERE id = ?`, id) + + e, err := scanEntry(row) + if errors.Is(err, sql.ErrNoRows) { + return memory.Entry{}, fmt.Errorf("entry %q: %w", id, memory.ErrNotFound) + } + if err != nil { + return memory.Entry{}, err + } + + e.History, err = s.loadHistory(ctx, id) + return e, err +} + +// Update replaces content and appends the old content to revisions. 
+func (s *Store) Update(ctx context.Context, id, content string, author memory.AuthorType, note string) error { + tx, err := s.db.BeginTx(ctx, nil) + if err != nil { + return err + } + defer rollback(tx) + + var oldContent string + if err := tx.QueryRowContext(ctx, `SELECT content FROM memory_entries WHERE id = ?`, id).Scan(&oldContent); err != nil { + if errors.Is(err, sql.ErrNoRows) { + return fmt.Errorf("entry %q: %w", id, memory.ErrNotFound) + } + return err + } + + if _, err := tx.ExecContext(ctx, + `INSERT INTO memory_revisions (entry_id, content, author, correction_note, created_at) + VALUES (?, ?, ?, ?, ?)`, + id, oldContent, string(author), note, time.Now().UTC().Format(time.RFC3339Nano), + ); err != nil { + return err + } + + if _, err := tx.ExecContext(ctx, + `UPDATE memory_entries SET content = ?, updated_at = ? WHERE id = ?`, + content, time.Now().UTC().Format(time.RFC3339Nano), id, + ); err != nil { + return err + } + + return tx.Commit() +} + +// Flag marks an entry as potentially stale. +func (s *Store) Flag(ctx context.Context, id, reason string) error { + now := time.Now().UTC().Format(time.RFC3339Nano) + _, err := s.db.ExecContext(ctx, + `UPDATE memory_entries SET status='flagged', flagged_at=?, flag_reason=?, updated_at=? WHERE id=?`, + now, reason, now, id) + return err +} + +// Unflag clears the flag on an entry. +func (s *Store) Unflag(ctx context.Context, id string) error { + now := time.Now().UTC().Format(time.RFC3339Nano) + _, err := s.db.ExecContext(ctx, + `UPDATE memory_entries SET status='active', flagged_at=NULL, flag_reason='', updated_at=? WHERE id=?`, + now, id) + return err +} + +// Delete permanently removes an entry. +func (s *Store) Delete(ctx context.Context, id string) error { + _, err := s.db.ExecContext(ctx, `DELETE FROM memory_entries WHERE id=?`, id) + return err +} + +// List returns entries matching the filter. 
+func (s *Store) List(ctx context.Context, f memory.ListFilter) ([]memory.Entry, error) { + query := `SELECT id, type, content, tags, author, agent_id, session_id, source, skill_ref, + status, trust_score, staleness_score, access_count, last_accessed_at, + flagged_at, flag_reason, ttl_days, expires_at, archived_at, + consolidated_into, crystallized_into, created_at, updated_at + FROM memory_entries WHERE 1=1` + var args []any + + if f.Type != nil { + query += " AND type=?" + args = append(args, string(*f.Type)) + } + if f.Author != nil { + query += " AND author=?" + args = append(args, string(*f.Author)) + } + if f.Source != nil { + query += " AND source=?" + args = append(args, string(*f.Source)) + } + if f.Status != nil { + query += " AND status=?" + args = append(args, string(*f.Status)) + } + if f.CreatedAfter != nil { + query += " AND created_at >= ?" + args = append(args, f.CreatedAfter.UTC().Format(time.RFC3339Nano)) + } + if f.CreatedBefore != nil { + query += " AND created_at <= ?" + args = append(args, f.CreatedBefore.UTC().Format(time.RFC3339Nano)) + } + + query += " ORDER BY created_at DESC" + if f.Limit > 0 { + query += " LIMIT ? OFFSET ?" + args = append(args, f.Limit, f.Offset) + } + + rows, err := s.db.QueryContext(ctx, query, args...) + if err != nil { + return nil, err + } + defer func() { _ = rows.Close() }() + + var entries []memory.Entry + for rows.Next() { + e, err := scanEntry(rows) + if err != nil { + return nil, err + } + entries = append(entries, e) + } + return entries, rows.Err() +} + +// Archive transitions an entry to archived status. +func (s *Store) Archive(ctx context.Context, id string, reason memory.ArchiveReason, ref string) error { + now := time.Now().UTC().Format(time.RFC3339Nano) + field := consolidatedField(reason) + _, err := s.db.ExecContext(ctx, + fmt.Sprintf(`UPDATE memory_entries SET status='archived', archived_at=?, %s=?, updated_at=? 
WHERE id=?`, field), + now, ref, now, id) + return err +} + +// IncrementAccess increments the access counter and updates last_accessed_at. +func (s *Store) IncrementAccess(ctx context.Context, id string) error { + now := time.Now().UTC().Format(time.RFC3339Nano) + _, err := s.db.ExecContext(ctx, + `UPDATE memory_entries SET access_count=access_count+1, last_accessed_at=?, updated_at=? WHERE id=?`, + now, now, id) + return err +} + +// UpdateScores persists recomputed trust and staleness scores. +func (s *Store) UpdateScores(ctx context.Context, id string, trust, staleness float32) error { + _, err := s.db.ExecContext(ctx, + `UPDATE memory_entries SET trust_score=?, staleness_score=? WHERE id=?`, + trust, staleness, id) + return err +} + +// ListExpired returns active entries whose TTL has elapsed. +func (s *Store) ListExpired(ctx context.Context) ([]memory.Entry, error) { + now := time.Now().UTC().Format(time.RFC3339Nano) + rows, err := s.db.QueryContext(ctx, + `SELECT id, type, content, tags, author, agent_id, session_id, source, skill_ref, + status, trust_score, staleness_score, access_count, last_accessed_at, + flagged_at, flag_reason, ttl_days, expires_at, archived_at, + consolidated_into, crystallized_into, created_at, updated_at + FROM memory_entries + WHERE expires_at IS NOT NULL AND expires_at <= ? AND status NOT IN ('expired','archived')`, now) + if err != nil { + return nil, err + } + defer func() { _ = rows.Close() }() + var entries []memory.Entry + for rows.Next() { + e, err := scanEntry(rows) + if err != nil { + return nil, err + } + entries = append(entries, e) + } + return entries, rows.Err() +} + +// ListActive returns all active and flagged entries for score recomputation. 
+func (s *Store) ListActive(ctx context.Context) ([]memory.Entry, error) { + rows, err := s.db.QueryContext(ctx, + `SELECT id, type, content, tags, author, agent_id, session_id, source, skill_ref, + status, trust_score, staleness_score, access_count, last_accessed_at, + flagged_at, flag_reason, ttl_days, expires_at, archived_at, + consolidated_into, crystallized_into, created_at, updated_at + FROM memory_entries WHERE status IN ('active','flagged')`) + if err != nil { + return nil, err + } + defer func() { _ = rows.Close() }() + var entries []memory.Entry + for rows.Next() { + e, err := scanEntry(rows) + if err != nil { + return nil, err + } + entries = append(entries, e) + } + return entries, rows.Err() +} + +// ---- helpers ---- + +type scanner interface { + Scan(dest ...any) error +} + +func scanEntry(sc scanner) (memory.Entry, error) { + var e memory.Entry + var ( + mtype, author, source, status string + tagsJSON string + lastAccessed, flaggedAt sql.NullString + expiresAt, archivedAt sql.NullString + createdAt, updatedAt string + ) + err := sc.Scan( + &e.ID, &mtype, &e.Content, &tagsJSON, &author, + &e.AgentID, &e.SessionID, &source, &e.SkillRef, + &status, &e.TrustScore, &e.StalenessScore, &e.AccessCount, &lastAccessed, + &flaggedAt, &e.FlagReason, &e.TTLDays, &expiresAt, &archivedAt, + &e.ConsolidatedInto, &e.CrystallizedInto, &createdAt, &updatedAt, + ) + if err != nil { + return memory.Entry{}, err + } + e.Type = memory.Type(mtype) + e.Author = memory.AuthorType(author) + e.Source = memory.SourceType(source) + e.Status = memory.EntryStatus(status) + _ = json.Unmarshal([]byte(tagsJSON), &e.Tags) + e.CreatedAt, _ = parseTime(createdAt) + e.UpdatedAt, _ = parseTime(updatedAt) + if lastAccessed.Valid { + t, _ := parseTime(lastAccessed.String) + e.LastAccessedAt = t + } + if flaggedAt.Valid { + t, _ := parseTime(flaggedAt.String) + e.FlaggedAt = &t + } + if expiresAt.Valid { + t, _ := parseTime(expiresAt.String) + e.ExpiresAt = &t + } + if archivedAt.Valid { + 
t, _ := parseTime(archivedAt.String) + e.ArchivedAt = &t + } + return e, nil +} + +func (s *Store) loadHistory(ctx context.Context, entryID string) ([]memory.Revision, error) { + rows, err := s.db.QueryContext(ctx, + `SELECT content, author, correction_note, created_at + FROM memory_revisions WHERE entry_id=? ORDER BY created_at ASC`, entryID) + if err != nil { + return nil, err + } + defer func() { _ = rows.Close() }() + var revs []memory.Revision + for rows.Next() { + var r memory.Revision + var author, createdAt string + if err := rows.Scan(&r.Content, &author, &r.CorrectionNote, &createdAt); err != nil { + return nil, err + } + r.Author = memory.AuthorType(author) + r.Timestamp, _ = parseTime(createdAt) + revs = append(revs, r) + } + return revs, rows.Err() +} + +func nullableTime(t time.Time) any { + if t.IsZero() { + return nil + } + return t.UTC().Format(time.RFC3339Nano) +} + +func nullableTimePtr(t *time.Time) any { + if t == nil { + return nil + } + return t.UTC().Format(time.RFC3339Nano) +} + +func parseTime(s string) (time.Time, error) { + return time.Parse(time.RFC3339Nano, s) +} + +func consolidatedField(reason memory.ArchiveReason) string { + if reason == memory.ArchiveReasonCrystallized { + return "crystallized_into" + } + return "consolidated_into" +} + +func rollback(tx *sql.Tx) { + _ = tx.Rollback() +} diff --git a/pkg/memory/sqlite/store_test.go b/pkg/memory/sqlite/store_test.go new file mode 100644 index 0000000000..8b009d12b6 --- /dev/null +++ b/pkg/memory/sqlite/store_test.go @@ -0,0 +1,167 @@ +// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc. 
+// SPDX-License-Identifier: Apache-2.0 + +package sqlite_test + +import ( + "context" + "fmt" + "path/filepath" + "testing" + "time" + + "github.com/stretchr/testify/require" + + "github.com/stacklok/toolhive/pkg/memory" + memorysqlite "github.com/stacklok/toolhive/pkg/memory/sqlite" +) + +func openTestDB(t *testing.T) *memorysqlite.DB { + t.Helper() + dir := t.TempDir() + resolved, _ := filepath.EvalSymlinks(dir) + db, err := memorysqlite.Open(context.Background(), filepath.Join(resolved, "memory.db")) + require.NoError(t, err) + t.Cleanup(func() { _ = db.Close() }) + return db +} + +func TestMemoryStore_CreateAndGet(t *testing.T) { + t.Parallel() + db := openTestDB(t) + store := memorysqlite.NewStore(db) + + entry := memory.Entry{ + ID: "mem_test_001", + Type: memory.TypeSemantic, + Content: "we deploy to us-east-1", + Tags: []string{"deployment", "infra"}, + Author: memory.AuthorHuman, + Source: memory.SourceMemory, + Status: memory.EntryStatusActive, + CreatedAt: time.Now(), + UpdatedAt: time.Now(), + } + + err := store.Create(context.Background(), entry) + require.NoError(t, err) + + got, err := store.Get(context.Background(), "mem_test_001") + require.NoError(t, err) + require.Equal(t, entry.ID, got.ID) + require.Equal(t, entry.Content, got.Content) + require.Equal(t, entry.Tags, got.Tags) + require.Equal(t, entry.Author, got.Author) + require.Equal(t, entry.Status, got.Status) +} + +func TestMemoryStore_Update(t *testing.T) { + t.Parallel() + db := openTestDB(t) + store := memorysqlite.NewStore(db) + + entry := memory.Entry{ + ID: "mem_test_002", + Type: memory.TypeSemantic, + Content: "old content", + Author: memory.AuthorHuman, + Source: memory.SourceMemory, + Status: memory.EntryStatusActive, + CreatedAt: time.Now(), + UpdatedAt: time.Now(), + } + require.NoError(t, store.Create(context.Background(), entry)) + + err := store.Update(context.Background(), "mem_test_002", "new content", memory.AuthorHuman, "corrected") + require.NoError(t, err) + + got, err 
:= store.Get(context.Background(), "mem_test_002") + require.NoError(t, err) + require.Equal(t, "new content", got.Content) + require.Len(t, got.History, 1) + require.Equal(t, "old content", got.History[0].Content) + require.Equal(t, "corrected", got.History[0].CorrectionNote) +} + +func TestMemoryStore_Archive(t *testing.T) { + t.Parallel() + db := openTestDB(t) + store := memorysqlite.NewStore(db) + + entry := memory.Entry{ + ID: "mem_test_003", + Type: memory.TypeProcedural, + Content: "check Docker health before E2E tests", + Author: memory.AuthorAgent, + Source: memory.SourceMemory, + Status: memory.EntryStatusActive, + CreatedAt: time.Now(), + UpdatedAt: time.Now(), + } + require.NoError(t, store.Create(context.Background(), entry)) + + err := store.Archive(context.Background(), "mem_test_003", memory.ArchiveReasonConsolidated, "mem_test_consolidated") + require.NoError(t, err) + + got, err := store.Get(context.Background(), "mem_test_003") + require.NoError(t, err) + require.Equal(t, memory.EntryStatusArchived, got.Status) + require.Equal(t, "mem_test_consolidated", got.ConsolidatedInto) + require.NotNil(t, got.ArchivedAt) +} + +func TestMemoryStore_List(t *testing.T) { + t.Parallel() + db := openTestDB(t) + store := memorysqlite.NewStore(db) + + ctx := context.Background() + for i, content := range []string{"fact A", "fact B", "procedure X"} { + mtype := memory.TypeSemantic + if i == 2 { + mtype = memory.TypeProcedural + } + require.NoError(t, store.Create(ctx, memory.Entry{ + ID: fmt.Sprintf("mem_list_%d", i), + Type: mtype, + Content: content, + Author: memory.AuthorHuman, + Source: memory.SourceMemory, + Status: memory.EntryStatusActive, + CreatedAt: time.Now(), + UpdatedAt: time.Now(), + })) + } + + sem := memory.TypeSemantic + results, err := store.List(ctx, memory.ListFilter{Type: &sem, Limit: 10}) + require.NoError(t, err) + require.Len(t, results, 2) +} + +func TestMemoryStore_ListTimeRange(t *testing.T) { + t.Parallel() + db := openTestDB(t) + 
store := memorysqlite.NewStore(db)
+	ctx := context.Background()
+
+	past := time.Now().Add(-2 * time.Hour)
+	recent := time.Now().Add(-30 * time.Minute)
+
+	require.NoError(t, store.Create(ctx, memory.Entry{
+		ID: "mem_old", Type: memory.TypeEpisodic, Content: "old event",
+		Author: memory.AuthorAgent, Source: memory.SourceMemory, Status: memory.EntryStatusActive,
+		CreatedAt: past, UpdatedAt: past,
+	}))
+	require.NoError(t, store.Create(ctx, memory.Entry{
+		ID: "mem_new", Type: memory.TypeEpisodic, Content: "recent event",
+		Author: memory.AuthorAgent, Source: memory.SourceMemory, Status: memory.EntryStatusActive,
+		CreatedAt: recent, UpdatedAt: recent,
+	}))
+
+	cutoff := time.Now().Add(-1 * time.Hour)
+	results, err := store.List(ctx, memory.ListFilter{CreatedAfter: &cutoff})
+	require.NoError(t, err)
+	require.Len(t, results, 1)
+	require.Equal(t, "mem_new", results[0].ID)
+}
diff --git a/pkg/memory/sqlite/vector.go b/pkg/memory/sqlite/vector.go
new file mode 100644
index 0000000000..49b1cb5d6f
--- /dev/null
+++ b/pkg/memory/sqlite/vector.go
@@ -0,0 +1,127 @@
+// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc.
+// SPDX-License-Identifier: Apache-2.0
+
+package sqlite
+
+import (
+	"context"
+	"database/sql"
+	"encoding/json"
+	"fmt"
+	"math"
+	"sort"
+
+	"github.com/stacklok/toolhive/pkg/memory"
+)
+
+// VectorStore implements memory.VectorStore using JSON-encoded embeddings in
+// SQLite plus Go-native cosine similarity. Suitable for datasets up to ~100K
+// entries. Use an external VectorStore (Qdrant, pgvector) for larger datasets.
+type VectorStore struct {
+	db *sql.DB
+}
+
+// NewVectorStore creates a new SQLite-backed VectorStore.
+func NewVectorStore(wrapper *DB) *VectorStore {
+	return &VectorStore{db: wrapper.DB()}
+}
+
+var _ memory.VectorStore = (*VectorStore)(nil)
+
+// Upsert stores or replaces the embedding for entry id. 
+func (v *VectorStore) Upsert(ctx context.Context, id string, embedding []float32) error { + data, err := json.Marshal(embedding) + if err != nil { + return fmt.Errorf("marshalling embedding: %w", err) + } + _, err = v.db.ExecContext(ctx, + `INSERT INTO memory_embeddings (entry_id, embedding) VALUES (?,?) + ON CONFLICT(entry_id) DO UPDATE SET embedding=excluded.embedding`, + id, string(data)) + return err +} + +// Search loads all embeddings matching the filter, computes cosine similarity +// against query, and returns the topK results in descending score order. +func (v *VectorStore) Search( + ctx context.Context, query []float32, topK int, filter memory.VectorFilter, +) ([]memory.ScoredID, error) { + q := `SELECT e.entry_id, e.embedding + FROM memory_embeddings e + JOIN memory_entries m ON m.id = e.entry_id + WHERE 1=1` + var args []any + if filter.Type != nil { + q += " AND m.type=?" + args = append(args, string(*filter.Type)) + } + if filter.Status != nil { + q += " AND m.status=?" + args = append(args, string(*filter.Status)) + } + + rows, err := v.db.QueryContext(ctx, q, args...) + if err != nil { + return nil, err + } + defer func() { _ = rows.Close() }() + + qNorm := l2Norm(query) + if qNorm == 0 { + return nil, fmt.Errorf("query vector has zero magnitude") + } + + var scored []memory.ScoredID + for rows.Next() { + var id, embJSON string + if err := rows.Scan(&id, &embJSON); err != nil { + return nil, err + } + var emb []float32 + if err := json.Unmarshal([]byte(embJSON), &emb); err != nil { + continue + } + sim := cosineSimilarity(query, emb, qNorm) + scored = append(scored, memory.ScoredID{ID: id, Similarity: sim}) + } + if err := rows.Err(); err != nil { + return nil, err + } + + sort.Slice(scored, func(i, j int) bool { + return scored[i].Similarity > scored[j].Similarity + }) + if topK > 0 && len(scored) > topK { + scored = scored[:topK] + } + return scored, nil +} + +// Delete removes the embedding for entry id. 
+func (v *VectorStore) Delete(ctx context.Context, id string) error { + _, err := v.db.ExecContext(ctx, `DELETE FROM memory_embeddings WHERE entry_id=?`, id) + return err +} + +func cosineSimilarity(a, b []float32, aNorm float32) float32 { + if len(a) != len(b) || aNorm == 0 { + return 0 + } + bNorm := l2Norm(b) + if bNorm == 0 { + return 0 + } + var dot float64 + for i := range a { + dot += float64(a[i]) * float64(b[i]) + } + return float32(dot / (float64(aNorm) * float64(bNorm))) +} + +func l2Norm(v []float32) float32 { + var sum float64 + for _, x := range v { + sum += float64(x) * float64(x) + } + return float32(math.Sqrt(sum)) +} diff --git a/pkg/memory/sqlite/vector_test.go b/pkg/memory/sqlite/vector_test.go new file mode 100644 index 0000000000..b613db0edc --- /dev/null +++ b/pkg/memory/sqlite/vector_test.go @@ -0,0 +1,74 @@ +// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc. +// SPDX-License-Identifier: Apache-2.0 + +package sqlite_test + +import ( + "context" + "testing" + + "github.com/stretchr/testify/require" + + "github.com/stacklok/toolhive/pkg/memory" + memorysqlite "github.com/stacklok/toolhive/pkg/memory/sqlite" +) + +func TestVectorStore_UpsertAndSearch(t *testing.T) { + t.Parallel() + db := openTestDB(t) + store := memorysqlite.NewStore(db) + vectors := memorysqlite.NewVectorStore(db) + + ctx := context.Background() + + entries := []struct { + id string + embedding []float32 + }{ + {"vec_001", []float32{1, 0, 0}}, + {"vec_002", []float32{0.9, 0.1, 0}}, + {"vec_003", []float32{0, 0, 1}}, + } + for _, e := range entries { + require.NoError(t, store.Create(ctx, memory.Entry{ + ID: e.id, Type: memory.TypeSemantic, Content: "c", + Author: memory.AuthorAgent, Source: memory.SourceMemory, + Status: memory.EntryStatusActive, + })) + require.NoError(t, vectors.Upsert(ctx, e.id, e.embedding)) + } + + query := []float32{0.95, 0.05, 0} + results, err := vectors.Search(ctx, query, 2, memory.VectorFilter{}) + require.NoError(t, err) + require.Len(t, 
results, 2)
+
+	ids := []string{results[0].ID, results[1].ID}
+	require.Contains(t, ids, "vec_001")
+	require.Contains(t, ids, "vec_002")
+	require.NotContains(t, ids, "vec_003")
+
+	require.GreaterOrEqual(t, results[0].Similarity, results[1].Similarity)
+}
+
+func TestVectorStore_Delete(t *testing.T) {
+	t.Parallel()
+	db := openTestDB(t)
+	store := memorysqlite.NewStore(db)
+	vectors := memorysqlite.NewVectorStore(db)
+
+	ctx := context.Background()
+	require.NoError(t, store.Create(ctx, memory.Entry{
+		ID: "vec_del", Type: memory.TypeSemantic, Content: "c",
+		Author: memory.AuthorAgent, Source: memory.SourceMemory,
+		Status: memory.EntryStatusActive,
+	}))
+	require.NoError(t, vectors.Upsert(ctx, "vec_del", []float32{1, 0, 0}))
+	require.NoError(t, vectors.Delete(ctx, "vec_del"))
+
+	results, err := vectors.Search(ctx, []float32{1, 0, 0}, 5, memory.VectorFilter{})
+	require.NoError(t, err)
+	for _, r := range results {
+		require.NotEqual(t, "vec_del", r.ID)
+	}
+}
diff --git a/pkg/memory/types.go b/pkg/memory/types.go
index 04fa0b1754..4af892eb74 100644
--- a/pkg/memory/types.go
+++ b/pkg/memory/types.go
@@ -6,16 +6,19 @@ package memory
 
 import "time"
 
-// MemoryType distinguishes the two long-term memory namespaces.
-//
-//nolint:revive // MemoryType is the canonical cross-package name; renaming to Type causes ambiguity.
-type MemoryType string
+// Type distinguishes the long-term memory namespaces.
+type Type string
 
 const (
-	// MemoryTypeSemantic represents factual knowledge and world-state memories.
-	MemoryTypeSemantic MemoryType = "semantic"
-	// MemoryTypeProcedural represents how-to knowledge and step-based memories.
-	MemoryTypeProcedural MemoryType = "procedural"
+	// TypeSemantic represents factual, aggregated knowledge and world-state memories
+	// (e.g. "company does not sponsor visas"). Contrast with TypeEpisodic.
+	TypeSemantic Type = "semantic"
+	// TypeProcedural represents how-to knowledge and step-based memories. 
+ TypeProcedural Type = "procedural" + // TypeEpisodic represents time-indexed event records tied to a specific + // moment (e.g. "recruiter archived candidate on 2024-03-15 — visa required"). + // Use CreatedAfter/CreatedBefore in ListFilter to query timelines. + TypeEpisodic Type = "episodic" ) // AuthorType records whether a memory was written by a human or an agent. @@ -67,12 +70,10 @@ const ( ArchiveReasonExpired ArchiveReason = "expired" ) -// MemoryEntry is the core domain type representing one stored memory. -// -//nolint:revive // MemoryEntry is the canonical cross-package name; renaming to Entry conflicts with common identifiers. -type MemoryEntry struct { +// Entry is the core domain type representing one stored memory. +type Entry struct { ID string - Type MemoryType + Type Type Content string Tags []string Author AuthorType @@ -92,15 +93,13 @@ type MemoryEntry struct { ArchivedAt *time.Time ConsolidatedInto string CrystallizedInto string - History []MemoryRevision + History []Revision CreatedAt time.Time UpdatedAt time.Time } -// MemoryRevision records a single correction to a memory entry. -// -//nolint:revive // MemoryRevision is the canonical cross-package name; renaming to Revision causes ambiguity. -type MemoryRevision struct { +// Revision records a single correction to a memory entry. +type Revision struct { Content string Author AuthorType CorrectionNote string @@ -109,18 +108,20 @@ type MemoryRevision struct { // ListFilter restricts results returned by MemoryStore.List. type ListFilter struct { - Type *MemoryType - Author *AuthorType - Tags []string - Source *SourceType - Status *EntryStatus - Limit int - Offset int + Type *Type + Author *AuthorType + Tags []string + Source *SourceType + Status *EntryStatus + CreatedAfter *time.Time + CreatedBefore *time.Time + Limit int + Offset int } // VectorFilter restricts similarity search to a subset of entries. 
type VectorFilter struct { - Type *MemoryType + Type *Type Status *EntryStatus } @@ -130,9 +131,9 @@ type ScoredID struct { Similarity float32 } -// ScoredEntry pairs a full MemoryEntry with its similarity to a query. +// ScoredEntry pairs a full Entry with its similarity to a query. type ScoredEntry struct { - Entry MemoryEntry + Entry Entry Similarity float32 } diff --git a/pkg/memory/types_test.go b/pkg/memory/types_test.go index 86b255f32f..8163259793 100644 --- a/pkg/memory/types_test.go +++ b/pkg/memory/types_test.go @@ -13,12 +13,19 @@ import ( func TestMemoryTypeConstants(t *testing.T) { t.Parallel() - require.Equal(t, memory.MemoryType("semantic"), memory.MemoryTypeSemantic) - require.Equal(t, memory.MemoryType("procedural"), memory.MemoryTypeProcedural) + require.Equal(t, memory.Type("semantic"), memory.TypeSemantic) + require.Equal(t, memory.Type("procedural"), memory.TypeProcedural) + require.Equal(t, memory.Type("episodic"), memory.TypeEpisodic) require.Equal(t, memory.AuthorType("human"), memory.AuthorHuman) require.Equal(t, memory.AuthorType("agent"), memory.AuthorAgent) require.Equal(t, memory.EntryStatus("active"), memory.EntryStatusActive) require.Equal(t, memory.EntryStatus("flagged"), memory.EntryStatusFlagged) require.Equal(t, memory.EntryStatus("expired"), memory.EntryStatusExpired) require.Equal(t, memory.EntryStatus("archived"), memory.EntryStatusArchived) + require.Equal(t, memory.SourceType("memory"), memory.SourceMemory) + require.Equal(t, memory.SourceType("skill"), memory.SourceSkill) + require.Equal(t, memory.ArchiveReason("consolidated"), memory.ArchiveReasonConsolidated) + require.Equal(t, memory.ArchiveReason("crystallized"), memory.ArchiveReasonCrystallized) + require.Equal(t, memory.ArchiveReason("manual"), memory.ArchiveReasonManual) + require.Equal(t, memory.ArchiveReason("expired"), memory.ArchiveReasonExpired) } From 1a30338a5798d2523670f35f873eeafe2b1bcc97 Mon Sep 17 00:00:00 2001 From: Reynier Ortiz Vega Date: Wed, 22 Apr 
2026 10:56:20 -0400 Subject: [PATCH 04/23] Add thv-memory MCP server binary Standalone MCP server exposing 9 memory tools over streamable HTTP (/mcp endpoint, /health liveness probe). Wires SQLite store and vector store, Ollama embedder, and a background lifecycle job that runs every 24h to expire TTL'd entries and recompute trust/staleness scores. Tools: memory_remember, memory_search, memory_recall, memory_forget, memory_update, memory_flag, memory_list, memory_consolidate, memory_crystallize. Config via memory-server.yaml with defaults (SQLite + sqlite-vec + Ollama on localhost:11434, listening on 0.0.0.0:8080). Co-Authored-By: Claude Sonnet 4.6 --- cmd/thv-memory/config.go | 112 ++++++++++++++++++++++++ cmd/thv-memory/integration_test.go | 114 ++++++++++++++++++++++++ cmd/thv-memory/lifecycle/job.go | 84 ++++++++++++++++++ cmd/thv-memory/lifecycle/job_test.go | 55 ++++++++++++ cmd/thv-memory/main.go | 124 +++++++++++++++++++++++++++ cmd/thv-memory/server.go | 46 ++++++++++ cmd/thv-memory/tools/consolidate.go | 69 +++++++++++++++ cmd/thv-memory/tools/crystallize.go | 74 ++++++++++++++++ cmd/thv-memory/tools/flag.go | 30 +++++++ cmd/thv-memory/tools/forget.go | 28 ++++++ cmd/thv-memory/tools/list.go | 47 ++++++++++ cmd/thv-memory/tools/recall.go | 36 ++++++++ cmd/thv-memory/tools/remember.go | 58 +++++++++++++ cmd/thv-memory/tools/search.go | 45 ++++++++++ cmd/thv-memory/tools/update.go | 44 ++++++++++ 15 files changed, 966 insertions(+) create mode 100644 cmd/thv-memory/config.go create mode 100644 cmd/thv-memory/integration_test.go create mode 100644 cmd/thv-memory/lifecycle/job.go create mode 100644 cmd/thv-memory/lifecycle/job_test.go create mode 100644 cmd/thv-memory/main.go create mode 100644 cmd/thv-memory/server.go create mode 100644 cmd/thv-memory/tools/consolidate.go create mode 100644 cmd/thv-memory/tools/crystallize.go create mode 100644 cmd/thv-memory/tools/flag.go create mode 100644 cmd/thv-memory/tools/forget.go create mode 100644 
cmd/thv-memory/tools/list.go create mode 100644 cmd/thv-memory/tools/recall.go create mode 100644 cmd/thv-memory/tools/remember.go create mode 100644 cmd/thv-memory/tools/search.go create mode 100644 cmd/thv-memory/tools/update.go diff --git a/cmd/thv-memory/config.go b/cmd/thv-memory/config.go new file mode 100644 index 0000000000..98cda699d9 --- /dev/null +++ b/cmd/thv-memory/config.go @@ -0,0 +1,112 @@ +// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc. +// SPDX-License-Identifier: Apache-2.0 + +// Package main is the entry point for the ToolHive memory MCP server. +package main + +import ( + "fmt" + "os" + + "gopkg.in/yaml.v3" +) + +const ( + providerOllama = "ollama" +) + +// Config is the memory server configuration, loaded from memory-server.yaml. +type Config struct { + Storage StorageConfig `yaml:"storage"` + Vector VectorConfig `yaml:"vector"` + Embedder EmbedderConfig `yaml:"embedder"` + Server ServerConfig `yaml:"server"` +} + +// StorageConfig configures the Store backend. +type StorageConfig struct { + Provider string `yaml:"provider"` // sqlite (default) + DSN string `yaml:"dsn"` +} + +// VectorConfig configures the VectorStore backend. +type VectorConfig struct { + Provider string `yaml:"provider"` // sqlite-vec (default) | qdrant | pgvector + URL string `yaml:"url"` +} + +// EmbedderConfig configures the Embedder backend. +type EmbedderConfig struct { + Provider string `yaml:"provider"` // ollama (default) | openai + URL string `yaml:"url"` + Model string `yaml:"model"` +} + +// ServerConfig configures the MCP server itself. +type ServerConfig struct { + Name string `yaml:"name"` + Version string `yaml:"version"` + Host string `yaml:"host"` // default 0.0.0.0 + Port int `yaml:"port"` // default 8080 + LifecycleHours int `yaml:"lifecycle_interval_hours"` // default 24 +} + +// LoadConfig reads and validates config from path. The path is operator-supplied +// and expected to be a trusted config file location. 
+func LoadConfig(path string) (*Config, error) { + // G304: path is an operator-supplied config file, not user input. + data, err := os.ReadFile(path) //nolint:gosec + if err != nil { + return nil, fmt.Errorf("reading config: %w", err) + } + var cfg Config + if err := yaml.Unmarshal(data, &cfg); err != nil { + return nil, fmt.Errorf("parsing config: %w", err) + } + applyStorageDefaults(&cfg) + applyEmbedderDefaults(&cfg) + applyServerDefaults(&cfg) + return &cfg, nil +} + +func applyStorageDefaults(cfg *Config) { + if cfg.Storage.Provider == "" { + cfg.Storage.Provider = "sqlite" + } + if cfg.Storage.DSN == "" && cfg.Storage.Provider == "sqlite" { + cfg.Storage.DSN = "/data/memory.db" + } + if cfg.Vector.Provider == "" { + cfg.Vector.Provider = "sqlite-vec" + } +} + +func applyEmbedderDefaults(cfg *Config) { + if cfg.Embedder.Provider == "" { + cfg.Embedder.Provider = providerOllama + } + if cfg.Embedder.Model == "" { + cfg.Embedder.Model = "nomic-embed-text" + } + if cfg.Embedder.URL == "" && cfg.Embedder.Provider == providerOllama { + cfg.Embedder.URL = "http://localhost:11434" + } +} + +func applyServerDefaults(cfg *Config) { + if cfg.Server.Name == "" { + cfg.Server.Name = "toolhive-memory" + } + if cfg.Server.Version == "" { + cfg.Server.Version = "0.1.0" + } + if cfg.Server.Host == "" { + cfg.Server.Host = "0.0.0.0" + } + if cfg.Server.Port <= 0 { + cfg.Server.Port = 8080 + } + if cfg.Server.LifecycleHours <= 0 { + cfg.Server.LifecycleHours = 24 + } +} diff --git a/cmd/thv-memory/integration_test.go b/cmd/thv-memory/integration_test.go new file mode 100644 index 0000000000..923abbd140 --- /dev/null +++ b/cmd/thv-memory/integration_test.go @@ -0,0 +1,114 @@ +// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc. 
+// SPDX-License-Identifier: Apache-2.0 + +package main_test + +import ( + "context" + "path/filepath" + "testing" + + "github.com/stretchr/testify/require" + "go.uber.org/zap/zaptest" + + "github.com/stacklok/toolhive/pkg/memory" + memorysqlite "github.com/stacklok/toolhive/pkg/memory/sqlite" +) + +// fakeEmbedder returns a deterministic embedding for testing without a real model server. +type fakeEmbedder struct{} + +func (*fakeEmbedder) Embed(_ context.Context, text string) ([]float32, error) { + v := []float32{0, 0, 0} + for i, c := range text { + if i >= 3 { + break + } + v[i] = float32(c) / 128.0 + } + return v, nil +} + +func (*fakeEmbedder) Dimensions() int { return 3 } + +func TestIntegration_RememberSearchForget(t *testing.T) { + t.Parallel() + dir := t.TempDir() + resolved, _ := filepath.EvalSymlinks(dir) + db, err := memorysqlite.Open(context.Background(), filepath.Join(resolved, "test.db")) + require.NoError(t, err) + t.Cleanup(func() { _ = db.Close() }) + + store := memorysqlite.NewStore(db) + vectors := memorysqlite.NewVectorStore(db) + svc, err := memory.NewService(store, vectors, &fakeEmbedder{}, zaptest.NewLogger(t)) + require.NoError(t, err) + + ctx := context.Background() + + r, err := svc.Remember(ctx, memory.RememberInput{ + Content: "deploy to us-east-1", + Type: memory.TypeSemantic, + Author: memory.AuthorHuman, + }) + require.NoError(t, err) + require.NotEmpty(t, r.MemoryID) + require.Empty(t, r.Conflicts) + + results, err := svc.Search(ctx, "deploy to us-east-1", nil, 5) + require.NoError(t, err) + require.NotEmpty(t, results) + require.Equal(t, "deploy to us-east-1", results[0].Entry.Content) + + entry, err := store.Get(ctx, r.MemoryID) + require.NoError(t, err) + require.Equal(t, 1, entry.AccessCount) + + require.NoError(t, store.Delete(ctx, r.MemoryID)) + _, err = store.Get(ctx, r.MemoryID) + require.ErrorIs(t, err, memory.ErrNotFound) +} + +func TestIntegration_ConflictDetection(t *testing.T) { + t.Parallel() + dir := t.TempDir() + 
resolved, _ := filepath.EvalSymlinks(dir) + db, err := memorysqlite.Open(context.Background(), filepath.Join(resolved, "test2.db")) + require.NoError(t, err) + t.Cleanup(func() { _ = db.Close() }) + + store := memorysqlite.NewStore(db) + vectors := memorysqlite.NewVectorStore(db) + svc, err := memory.NewService(store, vectors, &fakeEmbedder{}, zaptest.NewLogger(t)) + require.NoError(t, err) + + ctx := context.Background() + + r1, err := svc.Remember(ctx, memory.RememberInput{ + Content: "auth port 8080", + Type: memory.TypeSemantic, + Author: memory.AuthorHuman, + }) + require.NoError(t, err) + require.NotEmpty(t, r1.MemoryID) + + // fakeEmbedder hashes first 3 chars — "aut" maps to same vector for both, + // so "auth port 9090" will have cosine similarity 1.0 with "auth port 8080". + r2, err := svc.Remember(ctx, memory.RememberInput{ + Content: "auth port 9090", + Type: memory.TypeSemantic, + Author: memory.AuthorAgent, + }) + require.NoError(t, err) + require.Empty(t, r2.MemoryID) + require.NotEmpty(t, r2.Conflicts) + + r3, err := svc.Remember(ctx, memory.RememberInput{ + Content: "auth port 9090", + Type: memory.TypeSemantic, + Author: memory.AuthorHuman, + Force: true, + }) + require.NoError(t, err) + require.NotEmpty(t, r3.MemoryID) +} diff --git a/cmd/thv-memory/lifecycle/job.go b/cmd/thv-memory/lifecycle/job.go new file mode 100644 index 0000000000..bf1469dd01 --- /dev/null +++ b/cmd/thv-memory/lifecycle/job.go @@ -0,0 +1,84 @@ +// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc. +// SPDX-License-Identifier: Apache-2.0 + +// Package lifecycle provides the background maintenance job for memory entries. +package lifecycle + +import ( + "context" + "time" + + "go.uber.org/zap" + + "github.com/stacklok/toolhive/pkg/memory" +) + +// StalenessAuditThreshold is the score above which entries are logged as audit candidates. 
+const StalenessAuditThreshold = float32(0.8) + +// Job runs periodic maintenance on the memory store: expiring TTL'd entries +// and recomputing trust/staleness scores. +type Job struct { + store memory.Store + log *zap.Logger +} + +// New creates a new lifecycle Job. +func New(store memory.Store, log *zap.Logger) *Job { + return &Job{store: store, log: log} +} + +// Run starts the background job, ticking at the given interval until ctx is cancelled. +func (j *Job) Run(ctx context.Context, interval time.Duration) { + ticker := time.NewTicker(interval) + defer ticker.Stop() + for { + select { + case <-ctx.Done(): + return + case <-ticker.C: + if err := j.RunOnce(ctx); err != nil { + j.log.Warn("lifecycle job error", zap.Error(err)) + } + } + } +} + +// RunOnce executes one maintenance pass: expire TTL'd entries, update scores. +func (j *Job) RunOnce(ctx context.Context) error { + if err := j.expireEntries(ctx); err != nil { + return err + } + return j.recomputeScores(ctx) +} + +func (j *Job) expireEntries(ctx context.Context) error { + expired, err := j.store.ListExpired(ctx) + if err != nil { + return err + } + for _, e := range expired { + if err := j.store.Archive(ctx, e.ID, memory.ArchiveReasonExpired, ""); err != nil { + j.log.Warn("failed to archive expired entry", zap.String("id", e.ID), zap.Error(err)) + } + } + return nil +} + +func (j *Job) recomputeScores(ctx context.Context) error { + entries, err := j.store.ListActive(ctx) + if err != nil { + return err + } + for _, e := range entries { + trust := memory.ComputeTrustScore(e) + staleness := memory.ComputeStalenessScore(e) + if err := j.store.UpdateScores(ctx, e.ID, trust, staleness); err != nil { + j.log.Warn("failed to update scores", zap.String("id", e.ID), zap.Error(err)) + } + if staleness >= StalenessAuditThreshold { + j.log.Debug("high staleness entry", zap.String("id", e.ID), zap.Float32("staleness", staleness)) + } + } + return nil +} diff --git a/cmd/thv-memory/lifecycle/job_test.go 
b/cmd/thv-memory/lifecycle/job_test.go new file mode 100644 index 0000000000..a4302e3eaa --- /dev/null +++ b/cmd/thv-memory/lifecycle/job_test.go @@ -0,0 +1,55 @@ +// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc. +// SPDX-License-Identifier: Apache-2.0 + +package lifecycle_test + +import ( + "context" + "testing" + "time" + + "github.com/stretchr/testify/require" + "go.uber.org/mock/gomock" + "go.uber.org/zap/zaptest" + + "github.com/stacklok/toolhive/cmd/thv-memory/lifecycle" + "github.com/stacklok/toolhive/pkg/memory" + "github.com/stacklok/toolhive/pkg/memory/mocks" +) + +func TestJob_RunOnce_ExpiresEntries(t *testing.T) { + t.Parallel() + ctrl := gomock.NewController(t) + store := mocks.NewMockStore(ctrl) + + expired := memory.Entry{ + ID: "mem_expired", + CreatedAt: time.Now().Add(-48 * time.Hour), + } + store.EXPECT().ListExpired(gomock.Any()).Return([]memory.Entry{expired}, nil) + store.EXPECT().Archive(gomock.Any(), "mem_expired", memory.ArchiveReasonExpired, "").Return(nil) + store.EXPECT().ListActive(gomock.Any()).Return(nil, nil) + + job := lifecycle.New(store, zaptest.NewLogger(t)) + err := job.RunOnce(context.Background()) + require.NoError(t, err) +} + +func TestJob_RunOnce_UpdatesScores(t *testing.T) { + t.Parallel() + ctrl := gomock.NewController(t) + store := mocks.NewMockStore(ctrl) + + entry := memory.Entry{ + ID: "mem_active", + Author: memory.AuthorHuman, + CreatedAt: time.Now(), + } + store.EXPECT().ListExpired(gomock.Any()).Return(nil, nil) + store.EXPECT().ListActive(gomock.Any()).Return([]memory.Entry{entry}, nil) + store.EXPECT().UpdateScores(gomock.Any(), "mem_active", gomock.Any(), gomock.Any()).Return(nil) + + job := lifecycle.New(store, zaptest.NewLogger(t)) + err := job.RunOnce(context.Background()) + require.NoError(t, err) +} diff --git a/cmd/thv-memory/main.go b/cmd/thv-memory/main.go new file mode 100644 index 0000000000..e4ed9d023d --- /dev/null +++ b/cmd/thv-memory/main.go @@ -0,0 +1,124 @@ +// SPDX-FileCopyrightText: 
Copyright 2025 Stacklok, Inc. +// SPDX-License-Identifier: Apache-2.0 + +package main + +import ( + "context" + "errors" + "fmt" + "log" + "net" + "net/http" + "os" + "os/signal" + "syscall" + "time" + + "go.uber.org/zap" + + "github.com/stacklok/toolhive/cmd/thv-memory/lifecycle" + "github.com/stacklok/toolhive/pkg/memory" + "github.com/stacklok/toolhive/pkg/memory/embedder/ollama" + memorysqlite "github.com/stacklok/toolhive/pkg/memory/sqlite" +) + +const ( + readHeaderTimeout = 10 * time.Second + readTimeout = 30 * time.Second + // writeTimeout is intentionally long: SSE streams for MCP can be long-lived. + writeTimeout = 0 + idleTimeout = 120 * time.Second + shutdownTimeout = 10 * time.Second +) + +func main() { + cfgPath := os.Getenv("MEMORY_CONFIG") + if cfgPath == "" { + cfgPath = "/config/memory-server.yaml" + } + + cfg, err := LoadConfig(cfgPath) + if err != nil { + log.Fatalf("loading config: %v", err) + } + + logger, err := zap.NewProduction() + if err != nil { + log.Fatalf("creating logger: %v", err) + } + defer logger.Sync() //nolint:errcheck + + ctx, cancel := signal.NotifyContext(context.Background(), syscall.SIGINT, syscall.SIGTERM) + defer cancel() + + db, err := memorysqlite.Open(ctx, cfg.Storage.DSN) + if err != nil { + logger.Fatal("opening database", zap.Error(err)) + } + defer db.Close() //nolint:errcheck + + store := memorysqlite.NewStore(db) + vectors := memorysqlite.NewVectorStore(db) + + var embedder memory.Embedder + switch cfg.Embedder.Provider { + case providerOllama: + embedder, err = ollama.New(cfg.Embedder.URL, cfg.Embedder.Model) + if err != nil { + logger.Fatal("creating ollama embedder", zap.Error(err)) + } + default: + logger.Fatal("unsupported embedder provider", zap.String("provider", cfg.Embedder.Provider)) + } + + svc, err := memory.NewService(store, vectors, embedder, logger) + if err != nil { + logger.Fatal("creating memory service", zap.Error(err)) + } + + job := lifecycle.New(store, logger) + go job.Run(ctx, 
time.Duration(cfg.Server.LifecycleHours)*time.Hour) + + if err := serve(ctx, cfg, svc, store, logger); err != nil { + logger.Error("server exited with error", zap.Error(err)) + os.Exit(1) + } +} + +func serve(ctx context.Context, cfg *Config, svc *memory.Service, store memory.Store, logger *zap.Logger) error { + addr := fmt.Sprintf("%s:%d", cfg.Server.Host, cfg.Server.Port) + listener, err := net.Listen("tcp", addr) + if err != nil { + return fmt.Errorf("creating listener: %w", err) + } + + handler := newHandler(cfg, svc, store, logger) + httpServer := &http.Server{ + Handler: handler, + ReadHeaderTimeout: readHeaderTimeout, + ReadTimeout: readTimeout, + WriteTimeout: writeTimeout, + IdleTimeout: idleTimeout, + } + + errCh := make(chan error, 1) + go func() { + logger.Info("memory MCP server listening", + zap.String("addr", listener.Addr().String()), + zap.String("endpoint", mcpEndpointPath), + ) + if err := httpServer.Serve(listener); err != nil && !errors.Is(err, http.ErrServerClosed) { + errCh <- err + } + }() + + select { + case <-ctx.Done(): + shutCtx, shutCancel := context.WithTimeout(context.Background(), shutdownTimeout) + defer shutCancel() + return httpServer.Shutdown(shutCtx) + case err := <-errCh: + return err + } +} diff --git a/cmd/thv-memory/server.go b/cmd/thv-memory/server.go new file mode 100644 index 0000000000..09cf635883 --- /dev/null +++ b/cmd/thv-memory/server.go @@ -0,0 +1,46 @@ +// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc. +// SPDX-License-Identifier: Apache-2.0 + +package main + +import ( + "net/http" + + "github.com/mark3labs/mcp-go/server" + "go.uber.org/zap" + + "github.com/stacklok/toolhive/cmd/thv-memory/tools" + "github.com/stacklok/toolhive/pkg/memory" +) + +const mcpEndpointPath = "/mcp" + +// newHandler builds the MCP server, registers all memory tools, and returns an +// http.Handler that serves the MCP streamable-HTTP transport on /mcp plus a +// /health liveness probe. 
+func newHandler(cfg *Config, svc *memory.Service, store memory.Store, log *zap.Logger) http.Handler { + s := server.NewMCPServer(cfg.Server.Name, cfg.Server.Version) + + tools.RegisterRemember(s, svc) + tools.RegisterSearch(s, svc) + tools.RegisterRecall(s, store) + tools.RegisterForget(s, store) + tools.RegisterUpdate(s, store) + tools.RegisterFlag(s, store) + tools.RegisterList(s, store) + tools.RegisterConsolidate(s, svc, store) + tools.RegisterCrystallize(s, store) + + log.Debug("registered memory MCP tools", zap.String("endpoint", mcpEndpointPath)) + + streamable := server.NewStreamableHTTPServer(s, + server.WithEndpointPath(mcpEndpointPath), + ) + + mux := http.NewServeMux() + mux.HandleFunc("/health", func(w http.ResponseWriter, _ *http.Request) { + w.WriteHeader(http.StatusOK) + }) + mux.Handle("/", streamable) + return mux +} diff --git a/cmd/thv-memory/tools/consolidate.go b/cmd/thv-memory/tools/consolidate.go new file mode 100644 index 0000000000..3d7ef11913 --- /dev/null +++ b/cmd/thv-memory/tools/consolidate.go @@ -0,0 +1,69 @@ +// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc. +// SPDX-License-Identifier: Apache-2.0 + +// Package tools registers MCP tools for the memory server. +package tools + +import ( + "context" + "encoding/json" + "fmt" + "strings" + + "github.com/mark3labs/mcp-go/mcp" + "github.com/mark3labs/mcp-go/server" + + "github.com/stacklok/toolhive/pkg/memory" +) + +// RegisterConsolidate registers the memory_consolidate tool. +func RegisterConsolidate(s *server.MCPServer, svc *memory.Service, store memory.Store) { + tool := mcp.NewTool("memory_consolidate", + mcp.WithDescription( + "Merge related memory entries into one richer entry. 
"+ + "Originals are archived with a pointer to the new entry.", + ), + mcp.WithArray("ids", mcp.Required(), mcp.Description("Array of memory IDs to consolidate"), mcp.WithStringItems()), + mcp.WithString("content", mcp.Required(), mcp.Description("Content for the consolidated entry")), + mcp.WithString("type", mcp.Required(), mcp.Description("Memory type for the consolidated entry")), + ) + s.AddTool(tool, func(ctx context.Context, req mcp.CallToolRequest) (*mcp.CallToolResult, error) { + ids, err := req.RequireStringSlice("ids") + if err != nil { + return mcp.NewToolResultError("ids must be an array of strings"), nil + } + if len(ids) < 2 { + return mcp.NewToolResultError("at least 2 ids required"), nil + } + + content := req.GetString("content", "") + memTypeStr := req.GetString("type", "") + + result, err := svc.Remember(ctx, memory.RememberInput{ + Content: content, + Type: memory.Type(memTypeStr), + Author: memory.AuthorHuman, + Force: true, + }) + if err != nil { + return mcp.NewToolResultError(fmt.Sprintf("creating consolidated entry: %v", err)), nil + } + + var archiveErrors []string + for _, id := range ids { + if err := store.Archive(ctx, id, memory.ArchiveReasonConsolidated, result.MemoryID); err != nil { + archiveErrors = append(archiveErrors, fmt.Sprintf("%s: %v", id, err)) + } + } + + resp := map[string]any{ + "consolidated_id": result.MemoryID, + "archived_ids": ids, + } + if len(archiveErrors) > 0 { + resp["archive_errors"] = strings.Join(archiveErrors, "; ") + } + out, _ := json.Marshal(resp) + return mcp.NewToolResultText(string(out)), nil + }) +} diff --git a/cmd/thv-memory/tools/crystallize.go b/cmd/thv-memory/tools/crystallize.go new file mode 100644 index 0000000000..e7318a8127 --- /dev/null +++ b/cmd/thv-memory/tools/crystallize.go @@ -0,0 +1,74 @@ +// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc. 
+// SPDX-License-Identifier: Apache-2.0 + +package tools + +import ( + "context" + "encoding/json" + "fmt" + "strings" + + "github.com/mark3labs/mcp-go/mcp" + "github.com/mark3labs/mcp-go/server" + + "github.com/stacklok/toolhive/pkg/memory" +) + +// RegisterCrystallize registers the memory_crystallize tool. +func RegisterCrystallize(s *server.MCPServer, store memory.Store) { + tool := mcp.NewTool("memory_crystallize", + mcp.WithDescription("Generate a SKILL.md scaffold from procedural memory entries for human review and publishing."), + mcp.WithArray("ids", mcp.Required(), mcp.Description("Array of procedural memory IDs"), mcp.WithStringItems()), + mcp.WithString("name", mcp.Required(), mcp.Description("Proposed skill name (kebab-case)")), + ) + s.AddTool(tool, func(ctx context.Context, req mcp.CallToolRequest) (*mcp.CallToolResult, error) { + ids, err := req.RequireStringSlice("ids") + if err != nil { + return mcp.NewToolResultError("ids must be an array of strings"), nil + } + name := req.GetString("name", "") + + var contents []string + for _, id := range ids { + entry, err := store.Get(ctx, id) + if err != nil { + continue + } + contents = append(contents, entry.Content) + } + if len(contents) == 0 { + return mcp.NewToolResultError("no valid entries found"), nil + } + + scaffold := buildSkillScaffold(name, contents) + out, _ := json.Marshal(map[string]string{ + "skill_name": name, + "skill_md": scaffold, + "note": "Review this scaffold, edit as needed, then publish with: thv skills push " + name, + }) + return mcp.NewToolResultText(string(out)), nil + }) +} + +func buildSkillScaffold(name string, contents []string) string { + return fmt.Sprintf(`--- +name: %s +description: "[TODO: one-line description of what this skill does]" +--- + +# %s + +## Context + +This skill was crystallized from %d procedural memory entries. 
+ +## Guidance + +%s + +## When to Use + +[TODO: describe when an agent should apply this skill] +`, name, name, len(contents), "- "+strings.Join(contents, "\n- ")) +} diff --git a/cmd/thv-memory/tools/flag.go b/cmd/thv-memory/tools/flag.go new file mode 100644 index 0000000000..e7e648e74c --- /dev/null +++ b/cmd/thv-memory/tools/flag.go @@ -0,0 +1,30 @@ +// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc. +// SPDX-License-Identifier: Apache-2.0 + +package tools + +import ( + "context" + + "github.com/mark3labs/mcp-go/mcp" + "github.com/mark3labs/mcp-go/server" + + "github.com/stacklok/toolhive/pkg/memory" +) + +// RegisterFlag registers the memory_flag tool. +func RegisterFlag(s *server.MCPServer, store memory.Store) { + tool := mcp.NewTool("memory_flag", + mcp.WithDescription("Mark a memory as potentially stale without deleting it."), + mcp.WithString("id", mcp.Required(), mcp.Description("Memory entry ID")), + mcp.WithString("reason", mcp.Required(), mcp.Description("Why this memory may be stale")), + ) + s.AddTool(tool, func(ctx context.Context, req mcp.CallToolRequest) (*mcp.CallToolResult, error) { + id := req.GetString("id", "") + reason := req.GetString("reason", "") + if err := store.Flag(ctx, id, reason); err != nil { + return mcp.NewToolResultError(err.Error()), nil + } + return mcp.NewToolResultText(`{"status":"ok"}`), nil + }) +} diff --git a/cmd/thv-memory/tools/forget.go b/cmd/thv-memory/tools/forget.go new file mode 100644 index 0000000000..8ea8c27dee --- /dev/null +++ b/cmd/thv-memory/tools/forget.go @@ -0,0 +1,28 @@ +// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc. +// SPDX-License-Identifier: Apache-2.0 + +package tools + +import ( + "context" + + "github.com/mark3labs/mcp-go/mcp" + "github.com/mark3labs/mcp-go/server" + + "github.com/stacklok/toolhive/pkg/memory" +) + +// RegisterForget registers the memory_forget tool. 
+func RegisterForget(s *server.MCPServer, store memory.Store) { + tool := mcp.NewTool("memory_forget", + mcp.WithDescription("Delete a memory entry permanently."), + mcp.WithString("id", mcp.Required(), mcp.Description("Memory entry ID")), + ) + s.AddTool(tool, func(ctx context.Context, req mcp.CallToolRequest) (*mcp.CallToolResult, error) { + id := req.GetString("id", "") + if err := store.Delete(ctx, id); err != nil { + return mcp.NewToolResultError(err.Error()), nil + } + return mcp.NewToolResultText(`{"status":"ok"}`), nil + }) +} diff --git a/cmd/thv-memory/tools/list.go b/cmd/thv-memory/tools/list.go new file mode 100644 index 0000000000..b813dc4a18 --- /dev/null +++ b/cmd/thv-memory/tools/list.go @@ -0,0 +1,47 @@ +// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc. +// SPDX-License-Identifier: Apache-2.0 + +package tools + +import ( + "context" + "encoding/json" + + "github.com/mark3labs/mcp-go/mcp" + "github.com/mark3labs/mcp-go/server" + + "github.com/stacklok/toolhive/pkg/memory" +) + +// RegisterList registers the memory_list tool. +func RegisterList(s *server.MCPServer, store memory.Store) { + tool := mcp.NewTool("memory_list", + mcp.WithDescription("List memory entries with structured filters (not semantic). 
Use memory_search for semantic queries."), + mcp.WithString("type", mcp.Description("Filter by type: semantic or procedural")), + mcp.WithString("author", mcp.Description("Filter by author: human or agent")), + mcp.WithNumber("limit", mcp.Description("Max results (default 20)")), + mcp.WithNumber("offset", mcp.Description("Pagination offset")), + ) + s.AddTool(tool, func(ctx context.Context, req mcp.CallToolRequest) (*mcp.CallToolResult, error) { + var f memory.ListFilter + if rawType := req.GetString("type", ""); rawType != "" { + t := memory.Type(rawType) + f.Type = &t + } + if rawAuthor := req.GetString("author", ""); rawAuthor != "" { + a := memory.AuthorType(rawAuthor) + f.Author = &a + } + f.Limit = req.GetInt("limit", 20) + f.Offset = req.GetInt("offset", 0) + active := memory.EntryStatusActive + f.Status = &active + + entries, err := store.List(ctx, f) + if err != nil { + return mcp.NewToolResultError(err.Error()), nil + } + out, _ := json.Marshal(entries) + return mcp.NewToolResultText(string(out)), nil + }) +} diff --git a/cmd/thv-memory/tools/recall.go b/cmd/thv-memory/tools/recall.go new file mode 100644 index 0000000000..f4e52ccf21 --- /dev/null +++ b/cmd/thv-memory/tools/recall.go @@ -0,0 +1,36 @@ +// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc. +// SPDX-License-Identifier: Apache-2.0 + +package tools + +import ( + "context" + "encoding/json" + "errors" + + "github.com/mark3labs/mcp-go/mcp" + "github.com/mark3labs/mcp-go/server" + + "github.com/stacklok/toolhive/pkg/memory" +) + +// RegisterRecall registers the memory_recall tool. 
+func RegisterRecall(s *server.MCPServer, store memory.Store) { + tool := mcp.NewTool("memory_recall", + mcp.WithDescription("Fetch a specific memory entry by ID, including its full revision history."), + mcp.WithString("id", mcp.Required(), mcp.Description("Memory entry ID")), + ) + s.AddTool(tool, func(ctx context.Context, req mcp.CallToolRequest) (*mcp.CallToolResult, error) { + id := req.GetString("id", "") + entry, err := store.Get(ctx, id) + if err != nil { + if errors.Is(err, memory.ErrNotFound) { + return mcp.NewToolResultError("entry not found"), nil + } + return mcp.NewToolResultError(err.Error()), nil + } + _ = store.IncrementAccess(ctx, id) + out, _ := json.Marshal(entry) + return mcp.NewToolResultText(string(out)), nil + }) +} diff --git a/cmd/thv-memory/tools/remember.go b/cmd/thv-memory/tools/remember.go new file mode 100644 index 0000000000..58bb332b3c --- /dev/null +++ b/cmd/thv-memory/tools/remember.go @@ -0,0 +1,58 @@ +// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc. +// SPDX-License-Identifier: Apache-2.0 + +package tools + +import ( + "context" + "encoding/json" + + "github.com/mark3labs/mcp-go/mcp" + "github.com/mark3labs/mcp-go/server" + + "github.com/stacklok/toolhive/pkg/memory" +) + +// RegisterRemember registers the memory_remember tool. +func RegisterRemember(s *server.MCPServer, svc *memory.Service) { + tool := mcp.NewTool("memory_remember", + mcp.WithDescription("Store a new semantic or procedural memory. 
Returns conflict_detected if a similar memory exists."), + mcp.WithString("content", mcp.Required(), mcp.Description("The knowledge to store")), + mcp.WithString("type", mcp.Required(), mcp.Description("Memory type: semantic or procedural")), + mcp.WithString("author", mcp.Description("Author type: human or agent (default: agent)")), + mcp.WithString("session_id", mcp.Description("Originating session ID")), + mcp.WithNumber("ttl_days", mcp.Description("Optional TTL in days")), + mcp.WithBoolean("force", mcp.Description("Write even if conflicts detected")), + ) + s.AddTool(tool, func(ctx context.Context, req mcp.CallToolRequest) (*mcp.CallToolResult, error) { + content := req.GetString("content", "") + memTypeStr := req.GetString("type", "") + authorStr := req.GetString("author", "agent") + if authorStr == "" { + authorStr = "agent" + } + force := req.GetBool("force", false) + sessionID := req.GetString("session_id", "") + + var ttlDays *int + args := req.GetArguments() + if raw, ok := args["ttl_days"].(float64); ok { + v := int(raw) + ttlDays = &v + } + + result, err := svc.Remember(ctx, memory.RememberInput{ + Content: content, + Type: memory.Type(memTypeStr), + Author: memory.AuthorType(authorStr), + SessionID: sessionID, + TTLDays: ttlDays, + Force: force, + }) + if err != nil { + return mcp.NewToolResultError(err.Error()), nil + } + out, _ := json.Marshal(result) + return mcp.NewToolResultText(string(out)), nil + }) +} diff --git a/cmd/thv-memory/tools/search.go b/cmd/thv-memory/tools/search.go new file mode 100644 index 0000000000..9de39e0144 --- /dev/null +++ b/cmd/thv-memory/tools/search.go @@ -0,0 +1,45 @@ +// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc. +// SPDX-License-Identifier: Apache-2.0 + +package tools + +import ( + "context" + "encoding/json" + + "github.com/mark3labs/mcp-go/mcp" + "github.com/mark3labs/mcp-go/server" + + "github.com/stacklok/toolhive/pkg/memory" +) + +// RegisterSearch registers the memory_search tool. 
+func RegisterSearch(s *server.MCPServer, svc *memory.Service) { + tool := mcp.NewTool("memory_search", + mcp.WithDescription( + "Semantic search across memory entries. "+ + "Returns entries ranked by similarity with trust and staleness scores.", + ), + mcp.WithString("query", mcp.Required(), mcp.Description("Natural language query")), + mcp.WithString("type", mcp.Description("Filter by type: semantic or procedural")), + mcp.WithNumber("top_k", mcp.Description("Maximum results to return (default 10)")), + ) + s.AddTool(tool, func(ctx context.Context, req mcp.CallToolRequest) (*mcp.CallToolResult, error) { + query := req.GetString("query", "") + + var memType *memory.Type + if rawType := req.GetString("type", ""); rawType != "" { + t := memory.Type(rawType) + memType = &t + } + + topK := req.GetInt("top_k", 10) + + results, err := svc.Search(ctx, query, memType, topK) + if err != nil { + return mcp.NewToolResultError(err.Error()), nil + } + out, _ := json.Marshal(results) + return mcp.NewToolResultText(string(out)), nil + }) +} diff --git a/cmd/thv-memory/tools/update.go b/cmd/thv-memory/tools/update.go new file mode 100644 index 0000000000..c2925f6618 --- /dev/null +++ b/cmd/thv-memory/tools/update.go @@ -0,0 +1,44 @@ +// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc. +// SPDX-License-Identifier: Apache-2.0 + +package tools + +import ( + "context" + "encoding/json" + + "github.com/mark3labs/mcp-go/mcp" + "github.com/mark3labs/mcp-go/server" + + "github.com/stacklok/toolhive/pkg/memory" +) + +// RegisterUpdate registers the memory_update tool. +func RegisterUpdate(s *server.MCPServer, store memory.Store) { + tool := mcp.NewTool("memory_update", + mcp.WithDescription("Correct or refine an existing memory entry. 
Previous content is saved to history."), + mcp.WithString("id", mcp.Required(), mcp.Description("Memory entry ID")), + mcp.WithString("content", mcp.Required(), mcp.Description("Updated content")), + mcp.WithString("author", mcp.Description("Author type: human or agent (default: agent)")), + mcp.WithString("correction_note", mcp.Description("Explanation for the correction")), + ) + s.AddTool(tool, func(ctx context.Context, req mcp.CallToolRequest) (*mcp.CallToolResult, error) { + id := req.GetString("id", "") + content := req.GetString("content", "") + authorStr := req.GetString("author", "agent") + if authorStr == "" { + authorStr = "agent" + } + note := req.GetString("correction_note", "") + + if err := store.Update(ctx, id, content, memory.AuthorType(authorStr), note); err != nil { + return mcp.NewToolResultError(err.Error()), nil + } + entry, err := store.Get(ctx, id) + if err != nil { + return mcp.NewToolResultError(err.Error()), nil + } + out, _ := json.Marshal(entry) + return mcp.NewToolResultText(string(out)), nil + }) +} From a7fa58c7448c2b8df6c669a19893856fc973143d Mon Sep 17 00:00:00 2001 From: Reynier Ortiz Vega Date: Wed, 22 Apr 2026 10:56:49 -0400 Subject: [PATCH 05/23] Document shared memory server design and activation strategy Covers architecture, MCP tool surface, trust/staleness scoring, conflict detection, Skills relationship, a comparison with LinkedIn's Cognitive Memory Agent, and the recommended three-tier memory activation strategy (session-boundary injection, signal-based mid-session reads, write-on-observation). 
Co-Authored-By: Claude Sonnet 4.6 --- .../2026-04-22-shared-memory-server.md | 312 ++++++++++++++++++ 1 file changed, 312 insertions(+) create mode 100644 docs/proposals/2026-04-22-shared-memory-server.md diff --git a/docs/proposals/2026-04-22-shared-memory-server.md b/docs/proposals/2026-04-22-shared-memory-server.md new file mode 100644 index 0000000000..899d7b15e1 --- /dev/null +++ b/docs/proposals/2026-04-22-shared-memory-server.md @@ -0,0 +1,312 @@ +# Shared Long-Term Memory Server + +**Date:** 2026-04-22 +**Status:** Implementation in progress (Plan 1 of 3 complete) + +--- + +## Problem + +ToolHive manages MCPs (tools) and Skills (procedural knowledge as OCI artifacts). The missing +primitive is **shared long-term memory**: a team-wide knowledge store that agents can query and +contribute to across sessions. + +Without it, every agent session starts cold. Facts learned by one agent are invisible to others. +Patterns that emerge from repeated interactions are lost when the session ends. + +--- + +## Memory Types + +Three long-term memory namespaces are in scope: + +| Type | Purpose | Example | +|---|---|---| +| `semantic` | Aggregated facts and world-state knowledge | "Company does not sponsor visas" | +| `procedural` | How-to knowledge, heuristics, SOPs | "Always run `task lint-fix` before committing" | +| `episodic` | Time-indexed event records | "Recruiter archived candidate on 2024-03-15 — visa required" | + +**Out of scope:** working memory and conversational memory — agents handle those internally via +their context window. + +--- + +## Architecture + +### System Workload + +The memory server is ToolHive's first **system workload** — a managed MCP server auto-provisioned +by ToolHive rather than explicitly started by users. 
Key properties: + +- Auto-provisioned on first use (`thv memory init`) +- Persistent — excluded from `thv stop --all` +- Singleton per scope (one per team in `thv serve` mode) +- Registered in the registry under the reserved name `toolhive.memory` + +### Transport + +The memory server uses **MCP streamable HTTP** transport (not stdio). Agents connect via +`http://<host>:8080/mcp`. A `/health` liveness probe is available at the same host. + +### Pluggable Backends + +Three independent interfaces, configured via `memory-server.yaml`: + +```yaml +storage: + provider: sqlite # sqlite (default) | postgres | mongodb + dsn: /data/memory.db + +vector: + provider: sqlite-vec # sqlite-vec (default) | qdrant | pgvector + url: "" + +embedder: + provider: ollama # ollama (default) | openai | cohere + model: nomic-embed-text + url: http://localhost:11434 + +server: + host: 0.0.0.0 + port: 8080 + lifecycle_interval_hours: 24 +``` + +Zero-infra teams use SQLite defaults with no external dependencies. Teams with Postgres can +collapse both storage and vector into pgvector. + +### Deployment Modes + +**Local (`thv` CLI):** Personal memory, local container, SQLite defaults. + +**Team (`thv serve`):** Shared instance; all team agents connect via the API server proxy. +Auth enforced via existing OIDC middleware. + +**Kubernetes (`thv-operator`):** New `MCPMemoryServer` CRD (Plan 3). Operator reconciles to +`Deployment + Service + PVC`. + +--- + +## MCP Tool Surface + +Agents consume memory exactly like any other MCP — no special integration. + +| Tool | Description | +|---|---| +| `memory_remember` | Write a memory. 
Runs conflict detection; returns conflicts if similarity > 0.85 | +| `memory_search` | Semantic vector search, results ranked by composite trust+staleness score | +| `memory_recall` | Fetch a specific entry by ID, including full revision history | +| `memory_forget` | Delete a memory | +| `memory_update` | Correct content; previous version saved to revision history | +| `memory_flag` | Mark as potentially stale without deleting | +| `memory_list` | Structured listing with filters: type, author, tags, time-range | +| `memory_consolidate` | Merge related entries; originals archived with pointer | +| `memory_crystallize` | Promote procedural memories to a Skill scaffold for human authoring | + +### Conflict Detection + +On `memory_remember`, the server embeds the new content and searches for similar active entries. +If any entry has cosine similarity > 0.85, the write is blocked and the agent receives a +`conflict_detected` response with the conflicting entries. The agent decides: force-write, +update the existing entry, or abort. No LLM inference — the agent (which has context) is better +placed to judge whether two similar entries actually conflict. + +### Search Ranking + +`memory_search` returns results ranked by a composite score that combines vector similarity with +the entry's trust and staleness signals: + +``` +composite = similarity × trust_score × (1 - 0.3 × staleness_score) +``` + +This prevents a high-similarity but flagged or stale entry from ranking above a fresher, +more trusted one. 
+ +--- + +## Trust and Staleness Scoring + +### Trust Score + +``` +trust_score = author_weight + × age_decay(created_at, half_life=180d) + × (1 - min(corrections × 0.05, 0.30)) + × (0.5 if flagged else 1.0) + +author_weight: human=1.0, agent=0.7 +``` + +### Staleness Score + +``` +staleness_score = normalize(days_since_last_access, max=90d) + + (0.3 if flagged) + + min(corrections × 0.1, 0.3) +``` + +Entries with `staleness_score > 0.8` surface in the lifecycle audit log every 24 hours. + +--- + +## Skills Relationship + +Skills (existing) and procedural memory are the same kind of knowledge at different stages of +maturity: + +``` +Agent/human observes something + │ + ▼ + Procedural Memory ← fluid, emergent, evolving + (memory server) + │ + (patterns emerge, + human crystallizes) + │ + ▼ + Skill (OCI) ← crystallized, versioned, distributed + (existing skills system) +``` + +`memory_crystallize` bridges the gap: it takes stable procedural memory entries and produces a +`SKILL.md` scaffold for a human to author and push via `thv skills push`. The source entries are +archived with a `crystallized_into` pointer so search returns the canonical Skill instead. + +--- + +## Recommended Memory Activation Strategy + +Not every agent interaction should touch the memory server. The recommended approach is a +three-tier strategy: + +### Tier 1 — Session-boundary injection (always) + +At the **start** of every task-bearing session, the system prompt instructs the agent to run one +`memory_search` call with the task description before doing anything else. This is silent, +cheap (one vector search), and covers the most valuable case: cross-session continuity. + +``` +Before starting work, call memory_search with the task description to load +relevant team knowledge. Do this once, silently — do not explain it to the user. +``` + +At the **end** of a session, the agent writes what was discovered or decided that would be +useful to a different agent in a future session. 
+ +### Tier 2 — Signal-based mid-session reads (agent-decided) + +The system prompt instructs the agent to call `memory_search` when it encounters: + +1. **Uncertainty** — "I don't have enough context to answer this confidently" +2. **Cross-session references** — phrases like "last time", "previously", "we decided", + "our policy", "do you remember" +3. **Team-specific facts** — questions about preferences, conventions, or domain knowledge + not in the codebase or current context + +### Tier 3 — Write on observation, not speculation + +The agent calls `memory_remember` only for facts that: +- Were not already in the search results from Tier 1 +- Would be useful to a **different** agent in a **future** session + +The system prompt guidance: + +``` +Write a memory when you learn something that: +- corrects or refines an existing fact (use memory_update instead) +- is a team decision, constraint, or policy that will apply again +- is a recurring pattern observed more than once + +Do NOT write memories for facts already in the codebase, documentation, +or the current conversation context. +``` + +### Why not automatic ingestion? + +Auto-ingestion (LinkedIn's streaming pipeline approach) requires: +- An LLM call in the ingestion path to extract facts from raw transcripts +- Quality control to decide what is worth persisting +- Evaluation tooling to measure ingestion accuracy + +These are deferred to a later plan. The explicit tool-use model is more predictable and +debuggable for a v1, and the agent (which has full context) makes better judgments about +what is worth writing than a pipeline operating on raw text. + +--- + +## Comparison with LinkedIn's Cognitive Memory Agent + +LinkedIn's CMA (described in their [engineering blog](https://www.linkedin.com/blog/engineering/ai/the-linkedin-generative-ai-application-tech-stack-personalization-with-cognitive-memory-agent)) +is the closest public reference. 
Key differences: + +| Dimension | LinkedIn CMA | ToolHive Memory | +|---|---|---| +| Conflict detection | On roadmap | Implemented (cosine > 0.85) | +| Trust/staleness scoring | Time-based prioritization planned | Implemented (full formula + background job) | +| User control (list/update/delete/flag) | On roadmap | Implemented | +| Search ranking | Implicit | Composite score: similarity × trust × (1 − staleness penalty) | +| Episodic memory type | Distinct tier | `TypeEpisodic` with time-range `ListFilter` | +| Retrieval orchestration | LLM-powered multi-step planner | Agent calls tools directly (agent IS the orchestrator) | +| Hierarchical aggregation | Auto tree: events → summaries → facets | Explicit: `memory_consolidate` + `memory_crystallize` | +| Tenant isolation | Per-application isolated stores | Auth at proxy layer; storage-level namespace deferred | +| Auto ingestion pipeline | Streaming + batch LLM extraction | Deferred; `memory_distill` returns candidates for agent review | + +--- + +## Implementation Status + +### Plan 1 — Memory server core (this branch) + +- [x] `pkg/memory/` — domain types, interfaces (`Store`, `VectorStore`, `Embedder`), scoring, service +- [x] `pkg/memory/sqlite/` — SQLite Store + VectorStore (Go cosine similarity, no CGo) +- [x] `pkg/memory/embedder/ollama/` — Ollama HTTP embedder +- [x] `pkg/memory/mocks/` — gomock mocks for all three interfaces +- [x] `cmd/thv-memory/` — MCP server binary (streamable HTTP on `/mcp`) +- [x] `cmd/thv-memory/lifecycle/` — 24h background job (TTL expiry, score recomputation) +- [x] `cmd/thv-memory/tools/` — 9 MCP tool handlers +- [x] Integration test (SQLite + fake embedder, end-to-end remember → search → delete) + +### Plan 2 — CLI + system workload integration (not started) + +- `thv memory` subcommand tree +- System workload auto-provisioning (`thv memory init`) +- Registry integration under `toolhive.memory` + +### Plan 3 — Kubernetes operator (not started) + +- `MCPMemoryServer` CRD +- 
Operator controller: reconciles to `Deployment + Service + PVC` +- `MCPRegistry` integration + +--- + +## Package Layout + +``` +pkg/memory/ +├── types.go — Entry, Revision, ListFilter, VectorFilter, scoring types +├── interfaces.go — Store, VectorStore, Embedder interfaces + mockgen directives +├── service.go — Orchestration: conflict detection, remember, search +├── scoring.go — ComputeTrustScore, ComputeStalenessScore +├── errors.go — ErrNotFound +├── mocks/ — Generated gomock mocks +├── sqlite/ +│ ├── db.go — DB wrapper, WAL pragmas, goose migrations +│ ├── store.go — Store implementation +│ ├── vector.go — VectorStore implementation (Go cosine similarity) +│ └── migrations/ — goose SQL migrations +└── embedder/ + └── ollama/ — Ollama HTTP embedder + +cmd/thv-memory/ +├── main.go — Entry point, HTTP server lifecycle +├── server.go — MCP server construction, tool registration, HTTP handler +├── config.go — YAML config with defaults +├── lifecycle/ +│ └── job.go — Background maintenance job +└── tools/ — One file per MCP tool + ├── remember.go, search.go, recall.go, forget.go, update.go + ├── flag.go, list.go, consolidate.go, crystallize.go +``` From f8e4c92376d2198decc601f8e3fd032237bd784b Mon Sep 17 00:00:00 2001 From: Reynier Ortiz Vega Date: Fri, 24 Apr 2026 11:23:00 -0400 Subject: [PATCH 06/23] Add static resource entries with management REST API and MCP Resources sync UI-managed resource entries (source=resource) are stored in the database and exposed read-only to agents via MCP Resources protocol. The management REST API (/api/resources) lets the UI create, update, and delete resources; the MCP server is kept in sync so agents receive list_changed notifications and can discover new content progressively through memory_search or resources/list. 
- Add SourceResource type and ErrReadOnly sentinel; protect tool layer from mutating skill/resource entries (forget, update, flag) - Extend VectorFilter with Source field so search can scope to resources - Add management REST API package (cmd/thv-memory/resources/api.go) wired via closure injection to avoid circular imports with package main - Refactor server.go: split newMCPServer / newHandler, add RegisterResourceEntry / UnregisterResourceEntry helpers, LoadExistingResources at startup - Switch HTTP handler to streamable-HTTP transport (NewStreamableHTTPServer) Co-Authored-By: Claude Sonnet 4.6 --- cmd/thv-memory/main.go | 29 ++- cmd/thv-memory/resources/api.go | 327 ++++++++++++++++++++++++++++++++ cmd/thv-memory/server.go | 119 +++++++++++- cmd/thv-memory/tools/flag.go | 3 + cmd/thv-memory/tools/forget.go | 3 + cmd/thv-memory/tools/helpers.go | 25 +++ cmd/thv-memory/tools/update.go | 3 + pkg/memory/errors.go | 5 + pkg/memory/sqlite/vector.go | 4 + pkg/memory/types.go | 6 + 10 files changed, 513 insertions(+), 11 deletions(-) create mode 100644 cmd/thv-memory/resources/api.go create mode 100644 cmd/thv-memory/tools/helpers.go diff --git a/cmd/thv-memory/main.go b/cmd/thv-memory/main.go index e4ed9d023d..52704b3f3a 100644 --- a/cmd/thv-memory/main.go +++ b/cmd/thv-memory/main.go @@ -15,9 +15,11 @@ import ( "syscall" "time" + mcpserver "github.com/mark3labs/mcp-go/server" "go.uber.org/zap" "github.com/stacklok/toolhive/cmd/thv-memory/lifecycle" + "github.com/stacklok/toolhive/cmd/thv-memory/resources" "github.com/stacklok/toolhive/pkg/memory" "github.com/stacklok/toolhive/pkg/memory/embedder/ollama" memorysqlite "github.com/stacklok/toolhive/pkg/memory/sqlite" @@ -26,7 +28,7 @@ import ( const ( readHeaderTimeout = 10 * time.Second readTimeout = 30 * time.Second - // writeTimeout is intentionally long: SSE streams for MCP can be long-lived. + // writeTimeout is intentionally zero: SSE streams for MCP can be long-lived. 
writeTimeout = 0 idleTimeout = 120 * time.Second shutdownTimeout = 10 * time.Second @@ -80,20 +82,36 @@ func main() { job := lifecycle.New(store, logger) go job.Run(ctx, time.Duration(cfg.Server.LifecycleHours)*time.Hour) - if err := serve(ctx, cfg, svc, store, logger); err != nil { + s := newMCPServer(cfg, svc, store) + LoadExistingResources(ctx, s, store, logger) + + resourceAPI := resources.NewHandler( + store, vectors, embedder, + func(e memory.Entry) { RegisterResourceEntry(s, store, e) }, + func(id string) { UnregisterResourceEntry(s, id) }, + logger, + ) + + if err := serve(ctx, cfg, s, resourceAPI, logger); err != nil { logger.Error("server exited with error", zap.Error(err)) os.Exit(1) } } -func serve(ctx context.Context, cfg *Config, svc *memory.Service, store memory.Store, logger *zap.Logger) error { +func serve( + ctx context.Context, + cfg *Config, + s *mcpserver.MCPServer, + resourceAPI http.Handler, + logger *zap.Logger, +) error { addr := fmt.Sprintf("%s:%d", cfg.Server.Host, cfg.Server.Port) listener, err := net.Listen("tcp", addr) if err != nil { return fmt.Errorf("creating listener: %w", err) } - handler := newHandler(cfg, svc, store, logger) + handler := newHandler(s, resourceAPI, logger) httpServer := &http.Server{ Handler: handler, ReadHeaderTimeout: readHeaderTimeout, @@ -106,7 +124,8 @@ func serve(ctx context.Context, cfg *Config, svc *memory.Service, store memory.S go func() { logger.Info("memory MCP server listening", zap.String("addr", listener.Addr().String()), - zap.String("endpoint", mcpEndpointPath), + zap.String("mcp_endpoint", mcpEndpointPath), + zap.String("resource_api", "/api/resources"), ) if err := httpServer.Serve(listener); err != nil && !errors.Is(err, http.ErrServerClosed) { errCh <- err diff --git a/cmd/thv-memory/resources/api.go b/cmd/thv-memory/resources/api.go new file mode 100644 index 0000000000..94fa20277e --- /dev/null +++ b/cmd/thv-memory/resources/api.go @@ -0,0 +1,327 @@ +// SPDX-FileCopyrightText: Copyright 
2025 Stacklok, Inc. +// SPDX-License-Identifier: Apache-2.0 + +// Package resources provides the management REST API for UI-managed resource +// entries. Resource entries are stored as memory.Entry values with +// source=resource and are read-only to agents via MCP tools. +// +// Routes (all under /api/resources): +// +// POST /api/resources — create resource, embed content, register in MCP +// GET /api/resources — list resources (paginated via ?limit=&offset=) +// GET /api/resources/{id} — get single resource +// PUT /api/resources/{id} — update content (re-embeds), update MCP listing +// DELETE /api/resources/{id} — delete resource, unregister from MCP +package resources + +import ( + "context" + "encoding/json" + "errors" + "fmt" + "net/http" + "strconv" + "strings" + "time" + + "github.com/google/uuid" + "go.uber.org/zap" + + "github.com/stacklok/toolhive/pkg/memory" +) + +const ( + defaultListLimit = 50 + maxListLimit = 200 +) + +// Handler is the management REST API handler for resource entries. +// +// registerFn and unregisterFn are injected by the caller (package main) so +// that the resources package does not import the MCP server package directly. +// They keep the MCP resource listing in sync with the database: registerFn is +// called after a create or update, unregisterFn after a delete. +type Handler struct { + store memory.Store + vectors memory.VectorStore + embedder memory.Embedder + registerFn func(memory.Entry) + unregisterFn func(id string) + log *zap.Logger +} + +// NewHandler creates a new resource management Handler. +// +// registerFn and unregisterFn are the package-level MCP sync helpers from +// server.go (RegisterResourceEntry / UnregisterResourceEntry), wrapped as +// closures so this package does not need to import the MCP server package. 
+func NewHandler( + store memory.Store, + vectors memory.VectorStore, + embedder memory.Embedder, + registerFn func(memory.Entry), + unregisterFn func(id string), + log *zap.Logger, +) *Handler { + return &Handler{ + store: store, + vectors: vectors, + embedder: embedder, + registerFn: registerFn, + unregisterFn: unregisterFn, + log: log, + } +} + +// ServeHTTP routes /api/resources requests. +func (h *Handler) ServeHTTP(w http.ResponseWriter, r *http.Request) { + // Strip /api/resources prefix to get the remaining path. + path := strings.TrimPrefix(r.URL.Path, "/api/resources") + path = strings.TrimPrefix(path, "/") + + switch { + case path == "" && r.Method == http.MethodPost: + h.create(w, r) + case path == "" && r.Method == http.MethodGet: + h.list(w, r) + case path != "" && r.Method == http.MethodGet: + h.get(w, r, path) + case path != "" && r.Method == http.MethodPut: + h.update(w, r, path) + case path != "" && r.Method == http.MethodDelete: + h.delete(w, r, path) + default: + http.Error(w, "method not allowed", http.StatusMethodNotAllowed) + } +} + +// CreateResourceRequest is the payload for POST /api/resources. +type CreateResourceRequest struct { + Content string `json:"content"` + Type string `json:"type"` // semantic | procedural | episodic (default: semantic) + Tags []string `json:"tags"` +} + +// UpdateResourceRequest is the payload for PUT /api/resources/{id}. +type UpdateResourceRequest struct { + Content string `json:"content"` + Tags []string `json:"tags"` +} + +// ResourceResponse is the API representation of a resource entry. 
+type ResourceResponse struct { + ID string `json:"id"` + Content string `json:"content"` + Type string `json:"type"` + Tags []string `json:"tags"` + CreatedAt time.Time `json:"created_at"` + UpdatedAt time.Time `json:"updated_at"` +} + +func entryToResponse(e memory.Entry) ResourceResponse { + return ResourceResponse{ + ID: e.ID, + Content: e.Content, + Type: string(e.Type), + Tags: e.Tags, + CreatedAt: e.CreatedAt, + UpdatedAt: e.UpdatedAt, + } +} + +func (h *Handler) create(w http.ResponseWriter, r *http.Request) { + var req CreateResourceRequest + if err := json.NewDecoder(r.Body).Decode(&req); err != nil { + http.Error(w, "invalid request body", http.StatusBadRequest) + return + } + if strings.TrimSpace(req.Content) == "" { + http.Error(w, "content is required", http.StatusBadRequest) + return + } + + memType := memory.TypeSemantic + if req.Type != "" { + memType = memory.Type(req.Type) + } + + id := "res_" + uuid.New().String() + now := time.Now().UTC() + entry := memory.Entry{ + ID: id, + Type: memType, + Content: req.Content, + Tags: req.Tags, + Author: memory.AuthorHuman, + Source: memory.SourceResource, + Status: memory.EntryStatusActive, + TrustScore: 1.0, // resources are always fully trusted + CreatedAt: now, + UpdatedAt: now, + } + + if err := h.store.Create(r.Context(), entry); err != nil { + h.jsonError(w, fmt.Errorf("creating entry: %w", err)) + return + } + + embedding, err := h.embed(r.Context(), req.Content) + if err != nil { + _ = h.store.Delete(r.Context(), id) // rollback + h.jsonError(w, fmt.Errorf("embedding content: %w", err)) + return + } + if err := h.vectors.Upsert(r.Context(), id, embedding); err != nil { + _ = h.store.Delete(r.Context(), id) // rollback + h.jsonError(w, fmt.Errorf("storing embedding: %w", err)) + return + } + + h.registerFn(entry) + + w.Header().Set("Content-Type", "application/json") + w.WriteHeader(http.StatusCreated) + _ = json.NewEncoder(w).Encode(entryToResponse(entry)) +} + +func (h *Handler) list(w 
http.ResponseWriter, r *http.Request) { + limit, offset := parsePagination(r) + src := memory.SourceResource + entries, err := h.store.List(r.Context(), memory.ListFilter{ + Source: &src, + Limit: limit, + Offset: offset, + }) + if err != nil { + h.jsonError(w, err) + return + } + + resp := make([]ResourceResponse, 0, len(entries)) + for _, e := range entries { + resp = append(resp, entryToResponse(e)) + } + jsonOK(w, resp) +} + +func (h *Handler) get(w http.ResponseWriter, r *http.Request, id string) { + entry, err := h.store.Get(r.Context(), id) + if err != nil { + if errors.Is(err, memory.ErrNotFound) { + http.Error(w, "not found", http.StatusNotFound) + return + } + h.jsonError(w, err) + return + } + if entry.Source != memory.SourceResource { + http.Error(w, "not a resource entry", http.StatusNotFound) + return + } + jsonOK(w, entryToResponse(entry)) +} + +func (h *Handler) update(w http.ResponseWriter, r *http.Request, id string) { + entry, err := h.store.Get(r.Context(), id) + if err != nil { + if errors.Is(err, memory.ErrNotFound) { + http.Error(w, "not found", http.StatusNotFound) + return + } + h.jsonError(w, err) + return + } + if entry.Source != memory.SourceResource { + http.Error(w, "not a resource entry", http.StatusNotFound) + return + } + + var req UpdateResourceRequest + if err := json.NewDecoder(r.Body).Decode(&req); err != nil { + http.Error(w, "invalid request body", http.StatusBadRequest) + return + } + if strings.TrimSpace(req.Content) == "" { + http.Error(w, "content is required", http.StatusBadRequest) + return + } + + if err := h.store.Update(r.Context(), id, req.Content, memory.AuthorHuman, "updated via management API"); err != nil { + h.jsonError(w, fmt.Errorf("updating entry: %w", err)) + return + } + + embedding, err := h.embed(r.Context(), req.Content) + if err != nil { + h.log.Warn("failed to re-embed resource after update", zap.String("id", id), zap.Error(err)) + } else if err := h.vectors.Upsert(r.Context(), id, embedding); err != 
nil { + h.log.Warn("failed to update embedding after resource update", zap.String("id", id), zap.Error(err)) + } + + updated, err := h.store.Get(r.Context(), id) + if err != nil { + h.jsonError(w, err) + return + } + + h.registerFn(updated) + jsonOK(w, entryToResponse(updated)) +} + +func (h *Handler) delete(w http.ResponseWriter, r *http.Request, id string) { + entry, err := h.store.Get(r.Context(), id) + if err != nil { + if errors.Is(err, memory.ErrNotFound) { + http.Error(w, "not found", http.StatusNotFound) + return + } + h.jsonError(w, err) + return + } + if entry.Source != memory.SourceResource { + http.Error(w, "not a resource entry", http.StatusNotFound) + return + } + + if err := h.store.Delete(r.Context(), id); err != nil { + h.jsonError(w, fmt.Errorf("deleting entry: %w", err)) + return + } + if err := h.vectors.Delete(r.Context(), id); err != nil { + h.log.Warn("failed to delete embedding for resource", zap.String("id", id), zap.Error(err)) + } + + h.unregisterFn(id) + w.WriteHeader(http.StatusNoContent) +} + +func (h *Handler) embed(ctx context.Context, text string) ([]float32, error) { + return h.embedder.Embed(ctx, text) +} + +func (h *Handler) jsonError(w http.ResponseWriter, err error) { + h.log.Warn("resource API error", zap.Error(err)) + w.Header().Set("Content-Type", "application/json") + w.WriteHeader(http.StatusInternalServerError) + _ = json.NewEncoder(w).Encode(map[string]string{"error": err.Error()}) +} + +func jsonOK(w http.ResponseWriter, v any) { + w.Header().Set("Content-Type", "application/json") + _ = json.NewEncoder(w).Encode(v) +} + +func parsePagination(r *http.Request) (limit, offset int) { + limit = defaultListLimit + if l := r.URL.Query().Get("limit"); l != "" { + if v, err := strconv.Atoi(l); err == nil && v > 0 { + limit = min(v, maxListLimit) + } + } + if o := r.URL.Query().Get("offset"); o != "" { + if v, err := strconv.Atoi(o); err == nil && v >= 0 { + offset = v + } + } + return limit, offset +} diff --git 
a/cmd/thv-memory/server.go b/cmd/thv-memory/server.go index 09cf635883..97c5acb675 100644 --- a/cmd/thv-memory/server.go +++ b/cmd/thv-memory/server.go @@ -4,8 +4,13 @@ package main import ( + "context" + "errors" + "fmt" "net/http" + "strings" + "github.com/mark3labs/mcp-go/mcp" "github.com/mark3labs/mcp-go/server" "go.uber.org/zap" @@ -13,13 +18,20 @@ import ( "github.com/stacklok/toolhive/pkg/memory" ) -const mcpEndpointPath = "/mcp" +const ( + mcpEndpointPath = "/mcp" + resourceURIPrefix = "memory://resource/" + resourceURITemplate = "memory://resource/{id}" +) -// newHandler builds the MCP server, registers all memory tools, and returns an -// http.Handler that serves the MCP streamable-HTTP transport on /mcp plus a -// /health liveness probe. -func newHandler(cfg *Config, svc *memory.Service, store memory.Store, log *zap.Logger) http.Handler { - s := server.NewMCPServer(cfg.Server.Name, cfg.Server.Version) +// newMCPServer creates the MCP server and registers all memory tools. +// Resource capabilities (listChanged) are enabled so connected agents +// receive notifications/resources/list_changed whenever a resource is +// created or deleted via the management API. +func newMCPServer(cfg *Config, svc *memory.Service, store memory.Store) *server.MCPServer { + s := server.NewMCPServer(cfg.Server.Name, cfg.Server.Version, + server.WithResourceCapabilities(false, true), + ) tools.RegisterRemember(s, svc) tools.RegisterSearch(s, svc) @@ -31,6 +43,64 @@ func newHandler(cfg *Config, svc *memory.Service, store memory.Store, log *zap.L tools.RegisterConsolidate(s, svc, store) tools.RegisterCrystallize(s, store) + // URI template allows agents to probe a resource by known ID without listing. 
+ s.AddResourceTemplate( + mcp.NewResourceTemplate(resourceURITemplate, "Memory Resource", + mcp.WithTemplateDescription("A UI-managed reference document stored in the memory server."), + mcp.WithTemplateMIMEType("text/plain"), + ), + server.ResourceTemplateHandlerFunc(makeResourceReadHandler(store)), + ) + + return s +} + +// LoadExistingResources registers all persisted resource entries with the MCP +// server at startup so they appear in resources/list immediately. +func LoadExistingResources(ctx context.Context, s *server.MCPServer, store memory.Store, log *zap.Logger) { + src := memory.SourceResource + entries, err := store.List(ctx, memory.ListFilter{Source: &src, Limit: 1000}) + if err != nil { + log.Warn("failed to load existing resources", zap.Error(err)) + return + } + for _, e := range entries { + registerResource(s, store, e) + } + log.Debug("loaded existing resources", zap.Int("count", len(entries))) +} + +// RegisterResourceEntry adds a resource entry to the MCP server listing. +// mcp-go automatically sends notifications/resources/list_changed to all +// connected sessions when WithResourceCapabilities listChanged is true. +func RegisterResourceEntry(s *server.MCPServer, store memory.Store, e memory.Entry) { + // Remove any previous registration (e.g., on update with name change). + s.DeleteResources(resourceURIPrefix + e.ID) + registerResource(s, store, e) +} + +// UnregisterResourceEntry removes a resource entry from the MCP server listing. 
+func UnregisterResourceEntry(s *server.MCPServer, id string) { + s.DeleteResources(resourceURIPrefix + id) +} + +func registerResource(s *server.MCPServer, store memory.Store, e memory.Entry) { + name := resourceName(e) + s.AddResource( + mcp.NewResource(resourceURIPrefix+e.ID, name, + mcp.WithResourceDescription(fmt.Sprintf("Resource entry %s", e.ID)), + mcp.WithMIMEType("text/plain"), + ), + makeResourceReadHandler(store), + ) +} + +// newHandler wraps the MCP server in the streamable-HTTP transport and +// returns a mux that exposes: +// - /mcp — MCP streamable-HTTP transport +// - /api/ — Management REST API (resource CRUD for UI) +// - /health — Liveness probe +func newHandler(s *server.MCPServer, resourceAPI http.Handler, log *zap.Logger) http.Handler { log.Debug("registered memory MCP tools", zap.String("endpoint", mcpEndpointPath)) streamable := server.NewStreamableHTTPServer(s, @@ -41,6 +111,43 @@ func newHandler(cfg *Config, svc *memory.Service, store memory.Store, log *zap.L mux.HandleFunc("/health", func(w http.ResponseWriter, _ *http.Request) { w.WriteHeader(http.StatusOK) }) + mux.Handle("/api/", resourceAPI) mux.Handle("/", streamable) return mux } + +// makeResourceReadHandler returns a handler that reads entry content from the +// store. When store is nil the handler is a no-op placeholder replaced at +// resource-registration time by AddResource with a proper store reference. 
+func makeResourceReadHandler(store memory.Store) server.ResourceHandlerFunc { + return func(ctx context.Context, req mcp.ReadResourceRequest) ([]mcp.ResourceContents, error) { + if store == nil { + return nil, errors.New("resource store not initialised") + } + id, ok := strings.CutPrefix(req.Params.URI, resourceURIPrefix) + if !ok || id == "" { + return nil, fmt.Errorf("invalid resource URI: %s", req.Params.URI) + } + entry, err := store.Get(ctx, id) + if err != nil { + return nil, err + } + return []mcp.ResourceContents{ + mcp.TextResourceContents{ + URI: req.Params.URI, + MIMEType: "text/plain", + Text: entry.Content, + }, + }, nil + } +} + +// resourceName returns a short display name for a resource entry. +// Uses the first 60 characters of content as the name. +func resourceName(e memory.Entry) string { + name := e.Content + if len(name) > 60 { + name = name[:60] + "…" + } + return name +} diff --git a/cmd/thv-memory/tools/flag.go b/cmd/thv-memory/tools/flag.go index e7e648e74c..db1e986d42 100644 --- a/cmd/thv-memory/tools/flag.go +++ b/cmd/thv-memory/tools/flag.go @@ -22,6 +22,9 @@ func RegisterFlag(s *server.MCPServer, store memory.Store) { s.AddTool(tool, func(ctx context.Context, req mcp.CallToolRequest) (*mcp.CallToolResult, error) { id := req.GetString("id", "") reason := req.GetString("reason", "") + if err := checkMutable(ctx, store, id); err != nil { + return mcp.NewToolResultError(err.Error()), nil + } if err := store.Flag(ctx, id, reason); err != nil { return mcp.NewToolResultError(err.Error()), nil } diff --git a/cmd/thv-memory/tools/forget.go b/cmd/thv-memory/tools/forget.go index 8ea8c27dee..0c88ed1a43 100644 --- a/cmd/thv-memory/tools/forget.go +++ b/cmd/thv-memory/tools/forget.go @@ -20,6 +20,9 @@ func RegisterForget(s *server.MCPServer, store memory.Store) { ) s.AddTool(tool, func(ctx context.Context, req mcp.CallToolRequest) (*mcp.CallToolResult, error) { id := req.GetString("id", "") + if err := checkMutable(ctx, store, id); err != nil { + 
return mcp.NewToolResultError(err.Error()), nil + } if err := store.Delete(ctx, id); err != nil { return mcp.NewToolResultError(err.Error()), nil } diff --git a/cmd/thv-memory/tools/helpers.go b/cmd/thv-memory/tools/helpers.go new file mode 100644 index 0000000000..c8e262bb16 --- /dev/null +++ b/cmd/thv-memory/tools/helpers.go @@ -0,0 +1,25 @@ +// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc. +// SPDX-License-Identifier: Apache-2.0 + +package tools + +import ( + "context" + "fmt" + + "github.com/stacklok/toolhive/pkg/memory" +) + +// checkMutable returns an error if the entry's source type is read-only to +// agents (SourceSkill or SourceResource). These entries may only be modified +// via the management REST API, not via MCP tool calls. +func checkMutable(ctx context.Context, store memory.Store, id string) error { + entry, err := store.Get(ctx, id) + if err != nil { + return err + } + if entry.Source == memory.SourceSkill || entry.Source == memory.SourceResource { + return fmt.Errorf("entry %q (source=%s): %w", id, entry.Source, memory.ErrReadOnly) + } + return nil +} diff --git a/cmd/thv-memory/tools/update.go b/cmd/thv-memory/tools/update.go index c2925f6618..07cd9f2f2d 100644 --- a/cmd/thv-memory/tools/update.go +++ b/cmd/thv-memory/tools/update.go @@ -31,6 +31,9 @@ func RegisterUpdate(s *server.MCPServer, store memory.Store) { } note := req.GetString("correction_note", "") + if err := checkMutable(ctx, store, id); err != nil { + return mcp.NewToolResultError(err.Error()), nil + } if err := store.Update(ctx, id, content, memory.AuthorType(authorStr), note); err != nil { return mcp.NewToolResultError(err.Error()), nil } diff --git a/pkg/memory/errors.go b/pkg/memory/errors.go index b17a40c1a2..77aa21a1da 100644 --- a/pkg/memory/errors.go +++ b/pkg/memory/errors.go @@ -7,3 +7,8 @@ import "errors" // ErrNotFound is returned when a memory entry does not exist. 
var ErrNotFound = errors.New("memory entry not found") + +// ErrReadOnly is returned when an agent attempts to mutate an entry whose +// source type is read-only (SourceSkill or SourceResource). Use the +// management REST API to modify resource entries. +var ErrReadOnly = errors.New("memory entry is read-only") diff --git a/pkg/memory/sqlite/vector.go b/pkg/memory/sqlite/vector.go index 49b1cb5d6f..a0e734833b 100644 --- a/pkg/memory/sqlite/vector.go +++ b/pkg/memory/sqlite/vector.go @@ -59,6 +59,10 @@ func (v *VectorStore) Search( q += " AND m.status=?" args = append(args, string(*filter.Status)) } + if filter.Source != nil { + q += " AND m.source=?" + args = append(args, string(*filter.Source)) + } rows, err := v.db.QueryContext(ctx, q, args...) if err != nil { diff --git a/pkg/memory/types.go b/pkg/memory/types.go index 4af892eb74..7369656d3b 100644 --- a/pkg/memory/types.go +++ b/pkg/memory/types.go @@ -40,6 +40,11 @@ const ( SourceMemory SourceType = "memory" // SourceSkill indicates the entry is a read-only index of an installed Skill. SourceSkill SourceType = "skill" + // SourceResource indicates the entry is a UI-managed resource document that + // is read-only to agents. Resources are written via the management REST API + // and are progressively discovered by agents through memory_search and MCP + // Resources protocol (resources/list, resources/read). + SourceResource SourceType = "resource" ) // EntryStatus is the lifecycle state of a memory entry. @@ -123,6 +128,7 @@ type ListFilter struct { type VectorFilter struct { Type *Type Status *EntryStatus + Source *SourceType } // ScoredID pairs an entry ID with its cosine similarity to a query. 
From cea385920feaf9fcfc2c776933762d955663b763 Mon Sep 17 00:00:00 2001 From: Reynier Ortiz Vega Date: Fri, 24 Apr 2026 14:19:22 -0400 Subject: [PATCH 07/23] Add recruiter scenario demo for memory server MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Demonstrates all memory types in a realistic hiring workflow: a recruiter and hiring manager share memory across separate MCP sessions, showing how episodic and semantic memories prevent repeated mistakes (visa/salary mismatches) and how procedural patterns crystallize into a reusable Skill. demo/recruiter/ Makefile — build, start, demo, teardown in one place cmd/demo/main.go — Go binary: 7-phase recruiter scenario config/memory-server.yaml.tmpl — demo server config (port 8765, SQLite) data/job-description.txt — Senior Go Engineer JD ($100K–$150K) demo.tape — VHS recording script Run: cd demo/recruiter && make all cd demo/recruiter && make teardown (repeat) Co-Authored-By: Claude Sonnet 4.6 --- demo/recruiter/Makefile | 131 ++++++ demo/recruiter/cmd/demo/main.go | 391 ++++++++++++++++++ demo/recruiter/config/memory-server.yaml.tmpl | 15 + demo/recruiter/data/job-description.txt | 88 ++++ demo/recruiter/demo.tape | 93 +++++ 5 files changed, 718 insertions(+) create mode 100644 demo/recruiter/Makefile create mode 100644 demo/recruiter/cmd/demo/main.go create mode 100644 demo/recruiter/config/memory-server.yaml.tmpl create mode 100644 demo/recruiter/data/job-description.txt create mode 100644 demo/recruiter/demo.tape diff --git a/demo/recruiter/Makefile b/demo/recruiter/Makefile new file mode 100644 index 0000000000..d1f496ca87 --- /dev/null +++ b/demo/recruiter/Makefile @@ -0,0 +1,131 @@ +# ══════════════════════════════════════════════════════════════════════════════ +# ToolHive Memory Demo — The Recruiter Scenario +# ══════════════════════════════════════════════════════════════════════════════ +# +# Prerequisites +# • Ollama running locally with nomic-embed-text pulled +# brew 
install ollama && ollama pull nomic-embed-text && ollama serve +# • Go 1.22+ +# +# Quick start +# make all — build binaries, start server, run demo, stop server +# make demo — run demo only (server must already be running) +# make teardown — stop server, delete DB and demo binary (safe to repeat) +# +# Individual targets +# make build — build thv-memory server + demo binary +# make server-start — start memory server in background +# make server-stop — stop memory server +# make server-logs — tail server log file +# make status — check server health +# ══════════════════════════════════════════════════════════════════════════════ + +SHELL := /bin/bash +.DEFAULT_GOAL := all + +# Locate the worktree root (parent of demo/recruiter) +WORKTREE_ROOT := $(shell cd ../.. && pwd) + +# Binaries +SERVER_BIN := $(WORKTREE_ROOT)/bin/thv-memory +DEMO_BIN := $(CURDIR)/.demo-bin + +# Server config (generated from template) +CONFIG_TMPL := $(CURDIR)/config/memory-server.yaml.tmpl +CONFIG := $(CURDIR)/config/memory-server.yaml + +# Runtime files (all cleaned by teardown) +DB_FILE := $(CURDIR)/demo-memory.db +PID_FILE := $(CURDIR)/.server.pid +LOG_FILE := $(CURDIR)/.server.log + +# Demo server port — non-standard to avoid conflicts with anything on 8080 +PORT := 8765 +BASE_URL := http://127.0.0.1:$(PORT) + +# Env for the demo binary +DEMO_ENV := \ + MEMORY_MCP_URL=$(BASE_URL)/mcp \ + MEMORY_API_URL=$(BASE_URL)/api/resources \ + MEMORY_JD_FILE=$(CURDIR)/data/job-description.txt + +.PHONY: all demo build server-start server-stop server-wait server-logs status teardown + +# ── all: one-shot full demo ─────────────────────────────────────────────────── +all: build server-start server-wait demo server-stop + +# ── demo: run scenario (server must be up) ──────────────────────────────────── +demo: $(DEMO_BIN) + @echo "" + $(DEMO_ENV) $(DEMO_BIN) + +# ── build: compile both binaries ───────────────────────────────────────────── +build: $(SERVER_BIN) $(DEMO_BIN) + +$(SERVER_BIN): + @echo "▶ 
Building thv-memory server..." + cd $(WORKTREE_ROOT) && task build + @echo "✓ $(SERVER_BIN)" + +$(DEMO_BIN): $(CURDIR)/cmd/demo/main.go + @echo "▶ Building demo binary..." + cd $(WORKTREE_ROOT) && go build -o $(DEMO_BIN) ./demo/recruiter/cmd/demo/ + @echo "✓ $(DEMO_BIN)" + +# ── server config (generated from template) ────────────────────────────────── +$(CONFIG): $(CONFIG_TMPL) + @echo "▶ Generating server config..." + @sed 's|DEMO_DB_PATH|$(DB_FILE)|g' $(CONFIG_TMPL) > $(CONFIG) + @echo "✓ $(CONFIG)" + +# ── server-start ───────────────────────────────────────────────────────────── +server-start: $(SERVER_BIN) $(CONFIG) + @if [ -f $(PID_FILE) ] && kill -0 $$(cat $(PID_FILE)) 2>/dev/null; then \ + echo "⚠ Server already running (pid=$$(cat $(PID_FILE)))"; \ + else \ + echo "▶ Starting memory server on port $(PORT)..."; \ + MEMORY_CONFIG=$(CONFIG) $(SERVER_BIN) > $(LOG_FILE) 2>&1 & \ + echo $$! > $(PID_FILE); \ + echo "✓ Server started (pid=$$!, log=$(LOG_FILE))"; \ + fi + +# ── server-wait: poll /health until ready ──────────────────────────────────── +server-wait: + @printf "▶ Waiting for server..." 
+	@for i in $$(seq 1 30); do \
+		if curl -sf $(BASE_URL)/health > /dev/null 2>&1; then \
+			printf " ready!\n"; exit 0; \
+		fi; \
+		printf "."; sleep 1; \
+	done; \
+	printf " TIMEOUT\n"; \
+	echo "  Check logs: make server-logs"; \
+	exit 1
+
+# ── server-stop ────────────────────────────────────────────────────────────
+server-stop:
+	@if [ -f $(PID_FILE) ]; then \
+		PID=$$(cat $(PID_FILE)); \
+		kill $$PID 2>/dev/null && echo "✓ Server stopped (pid=$$PID)" || echo "⚠ Process $$PID not found"; \
+		rm -f $(PID_FILE); \
+	else \
+		echo "⚠ No PID file found — server may not be running"; \
+	fi
+
+# ── server-logs ────────────────────────────────────────────────────────────
+server-logs:
+	@tail -f $(LOG_FILE)
+
+# ── status: quick health check ─────────────────────────────────────────────
+status:
+	@if curl -sf $(BASE_URL)/health > /dev/null 2>&1; then \
+		echo "✓ Server healthy at $(BASE_URL)"; \
+	else \
+		echo "✗ Server not responding at $(BASE_URL)"; \
+	fi
+
+# ── teardown: stop server + wipe all demo data ─────────────────────────────
+teardown: server-stop
+	@echo "▶ Removing demo data..."
+	@rm -f $(DB_FILE) $(DEMO_BIN) $(LOG_FILE) $(CONFIG)
+	@echo "✓ Teardown complete — safe to run 'make all' again"
diff --git a/demo/recruiter/cmd/demo/main.go b/demo/recruiter/cmd/demo/main.go
new file mode 100644
index 0000000000..df749d3425
--- /dev/null
+++ b/demo/recruiter/cmd/demo/main.go
@@ -0,0 +1,391 @@
+// SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc.
+// SPDX-License-Identifier: Apache-2.0
+
+// Command demo runs the ToolHive Memory recruiter scenario.
+//
+// It exercises three memory types (semantic, episodic, procedural) plus an MCP resource,
+// demonstrates cross-session recall between a recruiter and a hiring manager,
+// and finishes by crystallizing the learned interview pattern into a Skill scaffold.
+// +// Configuration via environment variables: +// +// MEMORY_MCP_URL — MCP endpoint (default: http://127.0.0.1:8765/mcp) +// MEMORY_API_URL — Resources REST endpoint (default: http://127.0.0.1:8765/api/resources) +// MEMORY_JD_FILE — Path to job description file (default: data/job-description.txt) +package main + +import ( + "bytes" + "context" + "encoding/json" + "fmt" + "net/http" + "os" + "strings" + "time" + + mcpclient "github.com/mark3labs/mcp-go/client" + "github.com/mark3labs/mcp-go/client/transport" + "github.com/mark3labs/mcp-go/mcp" +) + +// ─── configuration ─────────────────────────────────────────────────────────── + +var ( + mcpURL = envOr("MEMORY_MCP_URL", "http://127.0.0.1:8765/mcp") + apiURL = envOr("MEMORY_API_URL", "http://127.0.0.1:8765/api/resources") + jdFile = envOr("MEMORY_JD_FILE", "data/job-description.txt") +) + +func envOr(key, def string) string { + if v := os.Getenv(key); v != "" { + return v + } + return def +} + +// ─── ANSI helpers ───────────────────────────────────────────────────────────── + +const ( + ansiReset = "\033[0m" + ansiBold = "\033[1m" + ansiDim = "\033[2m" + ansiRed = "\033[31m" + ansiGreen = "\033[32m" + ansiYellow = "\033[33m" + ansiPurple = "\033[35m" + ansiCyan = "\033[36m" + ansiWhite = "\033[97m" + ansiGray = "\033[90m" +) + +func c(color, s string) string { return color + s + ansiReset } + +// ─── main ───────────────────────────────────────────────────────────────────── + +func main() { + ctx := context.Background() + + jd, err := os.ReadFile(jdFile) + if err != nil { + fatalf("reading %s: %v\n Hint: run 'make demo' from demo/recruiter/", jdFile, err) + } + + printBanner() + + // ── Phase 1 · Resource ──────────────────────────────────────────────────── + phase(1, "Resources", "Upload the job description as a static MCP Resource (read-only to agents)") + resID := uploadResource(ctx, jd) + pause() + + // ── Phase 2 · Semantic Memory ───────────────────────────────────────────── + phase(2, "Semantic Memory", 
"Company-wide facts — any agent session can recall these at any time") + shared := newSession(ctx, "shared") + defer shared.Close() + + remember(ctx, shared, "semantic", + "Company does not sponsor US work visas for any engineering role", + "policy", "visa", "hiring") + remember(ctx, shared, "semantic", + "Senior Go Engineer base salary band: $100,000–$150,000 USD; total comp includes equity", + "compensation", "hiring", "senior-go-engineer") + remember(ctx, shared, "semantic", + "Engineering team is fully remote, US timezone preferred (EST/PST). Async-first culture.", + "remote", "culture", "hiring") + pause() + + // ── Phase 3 · Session 1 — Recruiter: Alice Chen (2026-04-24) ───────────── + phase(3, "Session 1 · Recruiter — Interview: Alice Chen", "2026-04-24") + recruiter := newSession(ctx, "recruiter") + defer recruiter.Close() + + remember(ctx, recruiter, "episodic", + "Interviewed Alice Chen on 2026-04-24 for Senior Go Engineer. "+ + "Strong distributed systems background (8 years Go, ex-Cloudflare). "+ + "Struggled under time pressure on the consensus algorithm question. "+ + "Technical screen: pass. Moved to final round with hiring manager.", + "alice-chen", "interview", "2026-04-24", "final-round") + remember(ctx, recruiter, "episodic", + "Alice Chen requires H1B visa sponsorship — ineligible per company policy. 
"+ + "Hiring manager loop should be cancelled to avoid wasting candidate and interviewer time.", + "alice-chen", "visa", "blocker", "2026-04-24") + pause() + + // ── Phase 4 · Session 2 — Hiring Manager: cold search ──────────────────── + phase(4, "Session 2 · Hiring Manager — Searching memory before the Alice call", + "Brand new session — no prior context loaded") + hm := newSession(ctx, "hiring-manager") + defer hm.Close() + + search(ctx, hm, "Alice Chen Senior Go Engineer interview") + search(ctx, hm, "visa sponsorship policy") + pause() + + // ── Phase 5 · Session 1 — Recruiter: Bob Martinez (2026-04-25) ─────────── + phase(5, "Session 1 · Recruiter — Interview: Bob Martinez", "2026-04-25") + remember(ctx, recruiter, "episodic", + "Interviewed Bob Martinez on 2026-04-25 for Senior Go Engineer. "+ + "Strong full-stack background but limited distributed systems experience. "+ + "Expects $160K base — above the $150K band ceiling. Not progressing.", + "bob-martinez", "interview", "2026-04-25") + proc1 := remember(ctx, recruiter, "procedural", + "Always clarify visa status and salary expectations within the first 15 minutes of "+ + "every phone screen. Two candidates in this cycle consumed significant recruiter "+ + "and hiring manager time before disqualifying on logistics.", + "phone-screen", "process", "hiring", "lesson-learned") + pause() + + // ── Phase 6 · Session 1 — Recruiter: Charlie Kim (2026-04-26) ──────────── + phase(6, "Session 1 · Recruiter — Interview: Charlie Kim", "2026-04-26 · HIRE") + remember(ctx, recruiter, "episodic", + "Interviewed Charlie Kim on 2026-04-26 for Senior Go Engineer. "+ + "US citizen, no sponsorship needed. 6 years Go, strong Kubernetes and controller-runtime experience. "+ + "Accepted $135K offer. 
RECOMMENDED FOR HIRE.", + "charlie-kim", "interview", "hire", "2026-04-26") + pause() + + // ── Phase 7 · Crystallize → Skill ───────────────────────────────────────── + phase(7, "Crystallize → Skill", "Promoting the phone-screen pattern to a reusable Skill scaffold") + crystallize(ctx, recruiter, "go-eng-phone-screen", proc1) + pause() + + printSummary(resID) +} + +// ─── MCP helpers ────────────────────────────────────────────────────────────── + +func newSession(ctx context.Context, name string) *mcpclient.Client { + t, err := transport.NewStreamableHTTP(mcpURL) + if err != nil { + fatalf("transport (%s): %v", name, err) + } + cl := mcpclient.NewClient(t) + if err := cl.Start(ctx); err != nil { + fatalf("start (%s): %v", name, err) + } + if _, err := cl.Initialize(ctx, mcp.InitializeRequest{ + Params: mcp.InitializeParams{ + ProtocolVersion: mcp.LATEST_PROTOCOL_VERSION, + ClientInfo: mcp.Implementation{Name: "demo-" + name, Version: "1.0"}, + }, + }); err != nil { + fatalf("initialize (%s): %v", name, err) + } + fmt.Printf(" %s Session opened: %s%s\n", c(ansiGray, "→"), c(ansiBold+ansiCyan, name), ansiReset) + return cl +} + +func callTool(ctx context.Context, cl *mcpclient.Client, tool string, args map[string]any) string { + result, err := cl.CallTool(ctx, mcp.CallToolRequest{ + Params: mcp.CallToolParams{Name: tool, Arguments: args}, + }) + if err != nil { + fatalf("tool/%s: %v", tool, err) + } + for _, content := range result.Content { + if tc, ok := content.(mcp.TextContent); ok { + return tc.Text + } + } + return "" +} + +func remember(ctx context.Context, cl *mcpclient.Client, memType, content string, tags ...string) string { + raw := callTool(ctx, cl, "memory_remember", map[string]any{ + "content": content, + "type": memType, + "author": "human", + "tags": tags, + }) + var resp struct { + Status string `json:"status"` + MemoryID string `json:"memory_id"` + } + _ = json.Unmarshal([]byte(raw), &resp) + + icon := typeIcon(memType) + fmt.Printf("\n %s %s 
%s\n", + icon, + c(ansiBold+typeColor(memType), "["+memType+"]"), + truncate(content, 72)) + if resp.MemoryID != "" { + fmt.Printf(" %sid=%-28s tags=%v%s\n", ansiGray, resp.MemoryID, tags, ansiReset) + } + return resp.MemoryID +} + +func search(ctx context.Context, cl *mcpclient.Client, query string) { + fmt.Printf("\n %s %s\n", c(ansiYellow, "🔍"), c(ansiBold, "search: ")+c(ansiCyan, `"`+query+`"`)) + + raw := callTool(ctx, cl, "memory_search", map[string]any{ + "query": query, + "top_k": 3, + }) + + var results []struct { + ID string `json:"id"` + Content string `json:"content"` + Type string `json:"type"` + Similarity float64 `json:"similarity"` + } + if err := json.Unmarshal([]byte(raw), &results); err != nil || len(results) == 0 { + fmt.Printf(" %sno results%s\n", ansiGray, ansiReset) + return + } + for _, r := range results { + fmt.Printf(" %s %s %s %s\n", + c(ansiGray, fmt.Sprintf("%.2f", r.Similarity)), + simBar(r.Similarity), + c(ansiDim+typeColor(r.Type), "["+r.Type+"]"), + truncate(r.Content, 62)) + } +} + +func crystallize(ctx context.Context, cl *mcpclient.Client, skillName string, ids ...string) { + raw := callTool(ctx, cl, "memory_crystallize", map[string]any{ + "ids": ids, + "name": skillName, + }) + var resp struct { + SkillName string `json:"skill_name"` + SkillMD string `json:"skill_md"` + Note string `json:"note"` + } + _ = json.Unmarshal([]byte(raw), &resp) + + fmt.Printf("\n %s Skill scaffold generated: %s\n", + c(ansiPurple, "💎"), + c(ansiBold+ansiCyan, resp.SkillName)) + fmt.Printf(" %s %s%s\n\n", ansiGray, resp.Note, ansiReset) + + divider := c(ansiDim, strings.Repeat("─", 62)) + fmt.Println(divider) + lines := strings.Split(resp.SkillMD, "\n") + limit := min(len(lines), 14) + for _, line := range lines[:limit] { + fmt.Printf(" %s%s%s\n", ansiGray, line, ansiReset) + } + if len(lines) > 14 { + fmt.Printf(" %s… (%d more lines)%s\n", ansiGray, len(lines)-14, ansiReset) + } + fmt.Println(divider) +} + +// ─── Resources REST API helper 
───────────────────────────────────────────────── + +func uploadResource(ctx context.Context, content []byte) string { + body, _ := json.Marshal(map[string]any{ + "content": string(content), + "type": "semantic", + "tags": []string{"job-description", "senior-go-engineer", "hiring"}, + }) + + req, err := http.NewRequestWithContext(ctx, http.MethodPost, apiURL, bytes.NewReader(body)) + if err != nil { + fatalf("building resource request: %v", err) + } + req.Header.Set("Content-Type", "application/json") + + resp, err := http.DefaultClient.Do(req) + if err != nil { + fatalf("POST %s: %v", apiURL, err) + } + defer resp.Body.Close() + + var r struct { + ID string `json:"id"` + } + _ = json.NewDecoder(resp.Body).Decode(&r) + + fmt.Printf("\n %s POST /api/resources ← Senior Go Engineer job description\n", c(ansiGray, "→")) + fmt.Printf(" %s Resource created: %s\n", c(ansiGreen, "✓"), c(ansiCyan, r.ID)) + fmt.Printf(" %s Agents discover it via memory_search or MCP resources/list%s\n", + c(ansiGreen, "✓"), ansiReset) + return r.ID +} + +// ─── display helpers ───────────────────────────────────────────────────────── + +func printBanner() { + bar := strings.Repeat("═", 64) + fmt.Printf("\n%s\n", c(ansiBold+ansiCyan, bar)) + fmt.Printf("%s\n", c(ansiBold+ansiCyan, " ToolHive Memory Demo — The Recruiter")) + fmt.Printf("%s\n", c(ansiCyan, " Scenario: Hiring a Senior Go Engineer at Stacklok")) + fmt.Printf("%s\n\n", c(ansiBold+ansiCyan, bar)) + fmt.Printf(" MCP endpoint : %s\n", c(ansiGray, mcpURL)) + fmt.Printf(" REST API : %s\n\n", c(ansiGray, apiURL)) +} + +func phase(n int, title, subtitle string) { + bar := strings.Repeat("─", 64) + fmt.Printf("\n%s\n", c(ansiYellow, bar)) + fmt.Printf(" %s\n", c(ansiBold+ansiWhite, fmt.Sprintf("Phase %d · %s", n, title))) + if subtitle != "" { + fmt.Printf(" %s%s%s\n", ansiGray, subtitle, ansiReset) + } + fmt.Printf("%s\n", c(ansiYellow, bar)) +} + +func printSummary(resourceID string) { + bar := strings.Repeat("═", 64) + 
fmt.Printf("\n\n%s\n", c(ansiBold+ansiGreen, bar)) + fmt.Printf("%s\n", c(ansiBold+ansiGreen, " Demo complete!")) + fmt.Printf("%s\n\n", c(ansiBold+ansiGreen, bar)) + fmt.Printf(" %-22s %s\n", "Resource uploaded:", c(ansiCyan, resourceID)) + fmt.Printf(" %-22s %s\n", "Semantic memories:", "3") + fmt.Printf(" %-22s %s\n", "Episodic memories:", "4 (Alice, Alice-visa, Bob, Charlie)") + fmt.Printf(" %-22s %s\n", "Procedural:", "1 → crystallized to Skill") + fmt.Printf(" %-22s %s\n", "Sessions demoed:", "3 (shared, recruiter, hiring-manager)") + fmt.Println() + fmt.Printf(" %sTo repeat the demo:%s make teardown && make all\n\n", + ansiGray, ansiReset) +} + +func typeIcon(t string) string { + switch t { + case "semantic": + return "🧠" + case "episodic": + return "📅" + case "procedural": + return "📋" + default: + return "💾" + } +} + +func typeColor(t string) string { + switch t { + case "semantic": + return ansiCyan + case "episodic": + return ansiYellow + case "procedural": + return ansiPurple + default: + return ansiWhite + } +} + +func simBar(sim float64) string { + n := int(sim * 10) + n = min(n, 10) + return c(ansiGreen, strings.Repeat("█", n)+strings.Repeat("░", 10-n)) +} + +func truncate(s string, n int) string { + s = strings.Join(strings.Fields(s), " ") // normalize whitespace + if len(s) <= n { + return s + } + return s[:n-1] + "…" +} + +func pause() { + time.Sleep(200 * time.Millisecond) +} + +func fatalf(format string, args ...any) { + fmt.Fprintf(os.Stderr, c(ansiRed, "ERROR: ")+format+"\n", args...) 
+ os.Exit(1) +} diff --git a/demo/recruiter/config/memory-server.yaml.tmpl b/demo/recruiter/config/memory-server.yaml.tmpl new file mode 100644 index 0000000000..9e5642ad2b --- /dev/null +++ b/demo/recruiter/config/memory-server.yaml.tmpl @@ -0,0 +1,15 @@ +storage: + provider: sqlite + dsn: DEMO_DB_PATH + +embedder: + provider: ollama + url: http://localhost:11434 + model: nomic-embed-text + +server: + name: "ToolHive Memory Demo" + version: "0.1.0" + host: "127.0.0.1" + port: 8765 + lifecycle_hours: 720 diff --git a/demo/recruiter/data/job-description.txt b/demo/recruiter/data/job-description.txt new file mode 100644 index 0000000000..1de97f0c97 --- /dev/null +++ b/demo/recruiter/data/job-description.txt @@ -0,0 +1,88 @@ +Senior Software Engineer, Platform (Go) +Stacklok · Remote (US only) + +━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ + +ABOUT STACKLOK + +Stacklok is an open-source security company building tools that help development +teams trust their software supply chain. We build ToolHive — a lightweight, +secure manager for Model Context Protocol (MCP) servers — and Minder, an +open-source policy engine for your software supply chain. + +We are a small, fully remote team. Everyone ships production code. We have a +strong bias toward async communication and written clarity over meetings. + +━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ + +COMPENSATION + +Base salary: $100,000 – $150,000 USD (depending on experience and location) +Total comp includes meaningful equity at an early-stage company. + +We do NOT sponsor US work visas. Candidates must be authorized to work in +the United States without sponsorship now or in the future. + +━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ + +THE ROLE + +We are looking for a Senior Software Engineer to join our platform team. You +will work on the core infrastructure powering ToolHive and contribute to our +Kubernetes operator (thv-operator). 
+ +WHAT YOU WILL DO + +• Design and implement distributed systems components for MCP server management +• Contribute to the Kubernetes operator using controller-runtime and CRDs +• Build and maintain the MCP proxy runner and authentication middleware +• Work across pkg/runner, pkg/auth, and cmd/thv layers of the codebase +• Write clean, well-tested Go with a focus on operational simplicity +• Review code, mentor peers, and raise the engineering bar across the team + +WHAT WE ARE LOOKING FOR + +• 5+ years of Go experience in production environments +• Strong distributed systems fundamentals (consensus, failure modes, back-pressure) +• Hands-on experience with Kubernetes and controller-runtime +• Familiarity with container runtimes (Docker, containerd) +• Strong written communication — we are async-first and documentation matters +• Comfort with open-source development and working in public + +NICE TO HAVE + +• Experience with MCP (Model Context Protocol) or similar tool-use protocols +• Contributions to open-source Go projects +• Experience with OCI registries and artifact management +• Familiarity with OIDC, OAuth 2.0, and modern auth patterns + +━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ + +WHAT WE OFFER + +• Fully remote (US only, EST/PST timezone preferred) +• $100,000–$150,000 base salary + equity +• Comprehensive health, dental, and vision insurance +• $3,000 annual learning & development stipend +• 4 weeks PTO + company holidays +• Home office stipend +• Async-first culture — no mandatory meetings before 9am your local time + +━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ + +HIRING PROCESS + +1. Recruiter phone screen (30 min) — role alignment, logistics, expectations +2. Technical screen with Go exercises (90 min) +3. System design interview (60 min) +4. Final loop: hiring manager + team lead (90 min) +5. Reference checks → offer + +We move quickly. Most candidates complete the process in 2–3 weeks. 
+ +━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ + +TO APPLY + +Apply via our careers page or reach out directly at careers@stacklok.com. +Please include a link to a Go project you are proud of — open source preferred. diff --git a/demo/recruiter/demo.tape b/demo/recruiter/demo.tape new file mode 100644 index 0000000000..dab96dc03b --- /dev/null +++ b/demo/recruiter/demo.tape @@ -0,0 +1,93 @@ +# ToolHive Memory Demo — The Recruiter +# Requires: vhs (brew install vhs), Ollama running, nomic-embed-text pulled +# +# Usage: +# cd demo/recruiter +# vhs demo.tape + +Output demo.gif +Set FontSize 14 +Set Width 140 +Set Height 46 +Set Theme "Dracula" +Set TypingSpeed 40ms +Set PlaybackSpeed 1.0 + +# ── title card ──────────────────────────────────────────────────────────────── +Hide +Type "echo ''" +Enter +Sleep 500ms +Show + +Type "# ToolHive Memory Demo — The Recruiter" +Sleep 1.5s +Enter +Sleep 300ms + +Type "# Hiring a Senior Go Engineer at Stacklok" +Sleep 1.5s +Enter +Sleep 500ms + +# ── step 1: change to demo dir ──────────────────────────────────────────────── +Type "cd demo/recruiter" +Sleep 500ms +Enter +Sleep 300ms + +# ── step 2: build ───────────────────────────────────────────────────────────── +Type "make build" +Sleep 500ms +Enter +Sleep 15s + +# ── step 3: start server ────────────────────────────────────────────────────── +Type "make server-start" +Sleep 500ms +Enter +Sleep 1s + +Type "make server-wait" +Sleep 500ms +Enter +Sleep 5s + +# ── step 4: run demo ────────────────────────────────────────────────────────── +Type "make demo" +Sleep 500ms +Enter + +# Phase 1: Resource upload (fast — pure HTTP) +Sleep 3s + +# Phase 2: Semantic memories (3 Ollama calls, ~3s each) +Sleep 12s + +# Phase 3: Recruiter session, Alice interviews (2 Ollama calls) +Sleep 8s + +# Phase 4: Hiring manager cold search (2 Ollama calls for query embed) +Sleep 8s + +# Phase 5: Bob + procedural memory (2 Ollama calls) +Sleep 8s + +# Phase 6: Charlie (1 Ollama call) +Sleep 5s + +# 
Phase 7: Crystallize (no embed needed) +Sleep 3s + +# Summary +Sleep 3s + +# ── step 5: teardown ────────────────────────────────────────────────────────── +Sleep 1s +Type "make teardown" +Sleep 500ms +Enter +Sleep 2s + +# Final pause +Sleep 2s From 51e1249d3e30995dba37cbc2e5c94a92d4a68ecb Mon Sep 17 00:00:00 2001 From: Reynier Ortiz Vega Date: Fri, 24 Apr 2026 14:28:33 -0400 Subject: [PATCH 08/23] Fix demo Makefile to build thv-memory binary directly task build only compiles bin/thv, not bin/thv-memory. Use go build directly to produce the correct server binary. Co-Authored-By: Claude Sonnet 4.6 --- demo/recruiter/Makefile | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/demo/recruiter/Makefile b/demo/recruiter/Makefile index d1f496ca87..caf2dbfb25 100644 --- a/demo/recruiter/Makefile +++ b/demo/recruiter/Makefile @@ -64,7 +64,8 @@ build: $(SERVER_BIN) $(DEMO_BIN) $(SERVER_BIN): @echo "▶ Building thv-memory server..." - cd $(WORKTREE_ROOT) && task build + @mkdir -p $(WORKTREE_ROOT)/bin + cd $(WORKTREE_ROOT) && go build -o $(SERVER_BIN) ./cmd/thv-memory/ @echo "✓ $(SERVER_BIN)" $(DEMO_BIN): $(CURDIR)/cmd/demo/main.go From b6057876ba840c876674fcb8ba6395ef8915a14b Mon Sep 17 00:00:00 2001 From: Reynier Ortiz Vega Date: Fri, 24 Apr 2026 16:42:10 -0400 Subject: [PATCH 09/23] Fix resource source constraint, add tags to remember tool, fix demo parsing - Migration 003: widen source CHECK to include 'resource' (was only 'memory','skill'), fixing the constraint violation on resource creation - remember tool: expose 'tags' parameter so agents can label memories at write time (was silently dropped) - Demo Makefile: teardown now deletes server binary so rebuild always picks up new migrations - Demo binary: add HTTP status check on resource upload; fix JSON field names to match Go struct serialisation (MemoryID not memory_id, Entry.Content not content at top level) Co-Authored-By: Claude Sonnet 4.6 --- cmd/thv-memory/tools/remember.go | 5 +- 
demo/recruiter/Makefile | 2 +- demo/recruiter/cmd/demo/main.go | 26 ++++-- .../migrations/003_add_resource_source.sql | 83 +++++++++++++++++++ 4 files changed, 106 insertions(+), 10 deletions(-) create mode 100644 pkg/memory/sqlite/migrations/003_add_resource_source.sql diff --git a/cmd/thv-memory/tools/remember.go b/cmd/thv-memory/tools/remember.go index 58bb332b3c..585fdcac83 100644 --- a/cmd/thv-memory/tools/remember.go +++ b/cmd/thv-memory/tools/remember.go @@ -18,8 +18,9 @@ func RegisterRemember(s *server.MCPServer, svc *memory.Service) { tool := mcp.NewTool("memory_remember", mcp.WithDescription("Store a new semantic or procedural memory. Returns conflict_detected if a similar memory exists."), mcp.WithString("content", mcp.Required(), mcp.Description("The knowledge to store")), - mcp.WithString("type", mcp.Required(), mcp.Description("Memory type: semantic or procedural")), + mcp.WithString("type", mcp.Required(), mcp.Description("Memory type: semantic, procedural, or episodic")), mcp.WithString("author", mcp.Description("Author type: human or agent (default: agent)")), + mcp.WithArray("tags", mcp.Description("Optional labels for filtering and retrieval"), mcp.WithStringItems()), mcp.WithString("session_id", mcp.Description("Originating session ID")), mcp.WithNumber("ttl_days", mcp.Description("Optional TTL in days")), mcp.WithBoolean("force", mcp.Description("Write even if conflicts detected")), @@ -31,6 +32,7 @@ func RegisterRemember(s *server.MCPServer, svc *memory.Service) { if authorStr == "" { authorStr = "agent" } + tags, _ := req.RequireStringSlice("tags") // optional; ignore error when absent force := req.GetBool("force", false) sessionID := req.GetString("session_id", "") @@ -45,6 +47,7 @@ func RegisterRemember(s *server.MCPServer, svc *memory.Service) { Content: content, Type: memory.Type(memTypeStr), Author: memory.AuthorType(authorStr), + Tags: tags, SessionID: sessionID, TTLDays: ttlDays, Force: force, diff --git a/demo/recruiter/Makefile 
b/demo/recruiter/Makefile index caf2dbfb25..d6d974c6cf 100644 --- a/demo/recruiter/Makefile +++ b/demo/recruiter/Makefile @@ -128,5 +128,5 @@ status: # ── teardown: stop server + wipe all demo data ─────────────────────────────── teardown: server-stop @echo "▶ Removing demo data..." - @rm -f $(DB_FILE) $(DEMO_BIN) $(LOG_FILE) $(CONFIG) + @rm -f $(DB_FILE) $(DEMO_BIN) $(SERVER_BIN) $(LOG_FILE) $(CONFIG) @echo "✓ Teardown complete — safe to run 'make all' again" diff --git a/demo/recruiter/cmd/demo/main.go b/demo/recruiter/cmd/demo/main.go index df749d3425..a8592c76d3 100644 --- a/demo/recruiter/cmd/demo/main.go +++ b/demo/recruiter/cmd/demo/main.go @@ -197,9 +197,10 @@ func remember(ctx context.Context, cl *mcpclient.Client, memType, content string "author": "human", "tags": tags, }) + // RememberResult serialises as {"MemoryID":"...","Conflicts":null} (no json tags). var resp struct { - Status string `json:"status"` - MemoryID string `json:"memory_id"` + MemoryID string `json:"MemoryID"` + Conflicts []any `json:"Conflicts"` } _ = json.Unmarshal([]byte(raw), &resp) @@ -222,11 +223,14 @@ func search(ctx context.Context, cl *mcpclient.Client, query string) { "top_k": 3, }) + // ScoredEntry serialises as {"Entry":{...},"Similarity":0.xx} (no json tags). 
var results []struct { - ID string `json:"id"` - Content string `json:"content"` - Type string `json:"type"` - Similarity float64 `json:"similarity"` + Entry struct { + ID string `json:"ID"` + Content string `json:"Content"` + Type string `json:"Type"` + } `json:"Entry"` + Similarity float64 `json:"Similarity"` } if err := json.Unmarshal([]byte(raw), &results); err != nil || len(results) == 0 { fmt.Printf(" %sno results%s\n", ansiGray, ansiReset) @@ -236,8 +240,8 @@ func search(ctx context.Context, cl *mcpclient.Client, query string) { fmt.Printf(" %s %s %s %s\n", c(ansiGray, fmt.Sprintf("%.2f", r.Similarity)), simBar(r.Similarity), - c(ansiDim+typeColor(r.Type), "["+r.Type+"]"), - truncate(r.Content, 62)) + c(ansiDim+typeColor(r.Entry.Type), "["+r.Entry.Type+"]"), + truncate(r.Entry.Content, 62)) } } @@ -292,6 +296,12 @@ func uploadResource(ctx context.Context, content []byte) string { } defer resp.Body.Close() + if resp.StatusCode != http.StatusCreated { + var errBody map[string]string + _ = json.NewDecoder(resp.Body).Decode(&errBody) + fatalf("POST /api/resources returned %d: %v", resp.StatusCode, errBody["error"]) + } + var r struct { ID string `json:"id"` } diff --git a/pkg/memory/sqlite/migrations/003_add_resource_source.sql b/pkg/memory/sqlite/migrations/003_add_resource_source.sql new file mode 100644 index 0000000000..d1455edf44 --- /dev/null +++ b/pkg/memory/sqlite/migrations/003_add_resource_source.sql @@ -0,0 +1,83 @@ +-- +goose Up + +-- SQLite does not support ALTER COLUMN, so we recreate the table with the +-- updated CHECK constraint to include the 'resource' source type. 
+ +CREATE TABLE IF NOT EXISTS memory_entries_new ( + id TEXT PRIMARY KEY, + type TEXT NOT NULL CHECK (type IN ('semantic','procedural','episodic')), + content TEXT NOT NULL, + tags TEXT NOT NULL DEFAULT '[]', + author TEXT NOT NULL CHECK (author IN ('human','agent')), + agent_id TEXT NOT NULL DEFAULT '', + session_id TEXT NOT NULL DEFAULT '', + source TEXT NOT NULL CHECK (source IN ('memory','skill','resource')), + skill_ref TEXT NOT NULL DEFAULT '', + status TEXT NOT NULL DEFAULT 'active' + CHECK (status IN ('active','flagged','expired','archived')), + trust_score REAL NOT NULL DEFAULT 0, + staleness_score REAL NOT NULL DEFAULT 0, + access_count INTEGER NOT NULL DEFAULT 0, + last_accessed_at TEXT, + flagged_at TEXT, + flag_reason TEXT NOT NULL DEFAULT '', + ttl_days INTEGER, + expires_at TEXT, + archived_at TEXT, + consolidated_into TEXT NOT NULL DEFAULT '', + crystallized_into TEXT NOT NULL DEFAULT '', + created_at TEXT NOT NULL, + updated_at TEXT NOT NULL +); + +INSERT INTO memory_entries_new SELECT * FROM memory_entries; +DROP TABLE memory_entries; +ALTER TABLE memory_entries_new RENAME TO memory_entries; + +CREATE INDEX IF NOT EXISTS idx_memory_entries_type_status + ON memory_entries(type, status); + +CREATE INDEX IF NOT EXISTS idx_memory_entries_expires_at + ON memory_entries(expires_at) WHERE expires_at IS NOT NULL; + +-- +goose Down + +-- Revert: drop resource rows then recreate the narrower constraint. 
+DELETE FROM memory_entries WHERE source = 'resource'; + +CREATE TABLE IF NOT EXISTS memory_entries_old ( + id TEXT PRIMARY KEY, + type TEXT NOT NULL CHECK (type IN ('semantic','procedural','episodic')), + content TEXT NOT NULL, + tags TEXT NOT NULL DEFAULT '[]', + author TEXT NOT NULL CHECK (author IN ('human','agent')), + agent_id TEXT NOT NULL DEFAULT '', + session_id TEXT NOT NULL DEFAULT '', + source TEXT NOT NULL CHECK (source IN ('memory','skill')), + skill_ref TEXT NOT NULL DEFAULT '', + status TEXT NOT NULL DEFAULT 'active' + CHECK (status IN ('active','flagged','expired','archived')), + trust_score REAL NOT NULL DEFAULT 0, + staleness_score REAL NOT NULL DEFAULT 0, + access_count INTEGER NOT NULL DEFAULT 0, + last_accessed_at TEXT, + flagged_at TEXT, + flag_reason TEXT NOT NULL DEFAULT '', + ttl_days INTEGER, + expires_at TEXT, + archived_at TEXT, + consolidated_into TEXT NOT NULL DEFAULT '', + crystallized_into TEXT NOT NULL DEFAULT '', + created_at TEXT NOT NULL, + updated_at TEXT NOT NULL +); + +INSERT INTO memory_entries_old SELECT * FROM memory_entries; +DROP TABLE memory_entries; +ALTER TABLE memory_entries_old RENAME TO memory_entries; + +CREATE INDEX IF NOT EXISTS idx_memory_entries_type_status + ON memory_entries(type, status); + +CREATE INDEX IF NOT EXISTS idx_memory_entries_expires_at + ON memory_entries(expires_at) WHERE expires_at IS NOT NULL; From 6db261a31476485a72aa1a51cf304a355dfcfad1 Mon Sep 17 00:00:00 2001 From: Reynier Ortiz Vega Date: Fri, 24 Apr 2026 17:06:39 -0400 Subject: [PATCH 10/23] Add Claude Code agent sessions to recruiter demo Phases 1-2 (resource upload, semantic memory) are handled by the Go setup binary. Phases 3-7 are now real Claude Code sessions using --print mode so the demo shows an actual AI agent consuming the memory MCP. 
- Add prompts/ directory with per-session prompt files for each phase: recruiter-alice, hiring-manager, recruiter-bob, recruiter-charlie, crystallize - Add Makefile targets: session-recruiter-alice, session-hiring-manager, session-recruiter-bob, session-recruiter-charlie, session-crystallize - Add mcp-config target that generates .demo.mcp.json for Claude Code - Update demo target to run setup binary then all five agent sessions in sequence - Update demo.tape VHS recording to show Claude Code session targets - Teardown now also removes .demo.mcp.json Co-Authored-By: Claude Sonnet 4.6 --- demo/recruiter/Makefile | 78 ++++++- demo/recruiter/cmd/demo/main.go | 225 +++++-------------- demo/recruiter/demo.tape | 75 ++++--- demo/recruiter/prompts/crystallize.txt | 13 ++ demo/recruiter/prompts/hiring-manager.txt | 12 + demo/recruiter/prompts/recruiter-alice.txt | 14 ++ demo/recruiter/prompts/recruiter-bob.txt | 15 ++ demo/recruiter/prompts/recruiter-charlie.txt | 12 + 8 files changed, 241 insertions(+), 203 deletions(-) create mode 100644 demo/recruiter/prompts/crystallize.txt create mode 100644 demo/recruiter/prompts/hiring-manager.txt create mode 100644 demo/recruiter/prompts/recruiter-alice.txt create mode 100644 demo/recruiter/prompts/recruiter-bob.txt create mode 100644 demo/recruiter/prompts/recruiter-charlie.txt diff --git a/demo/recruiter/Makefile b/demo/recruiter/Makefile index d6d974c6cf..7f79119e44 100644 --- a/demo/recruiter/Makefile +++ b/demo/recruiter/Makefile @@ -6,10 +6,12 @@ # • Ollama running locally with nomic-embed-text pulled # brew install ollama && ollama pull nomic-embed-text && ollama serve # • Go 1.22+ +# • Claude Code CLI installed and authenticated (for agent sessions) +# npm install -g @anthropic-ai/claude-code # # Quick start -# make all — build binaries, start server, run demo, stop server -# make demo — run demo only (server must already be running) +# make all — build binaries, start server, run full demo, stop server +# make demo — run 
full demo (server must already be running) # make teardown — stop server, delete DB and demo binary (safe to repeat) # # Individual targets @@ -18,6 +20,13 @@ # make server-stop — stop memory server # make server-logs — tail server log file # make status — check server health +# +# Agent sessions (run individually after setup phase) +# make session-recruiter-alice — Phase 3: recruiter records Alice's phone screen +# make session-hiring-manager — Phase 4: hiring manager searches memory cold +# make session-recruiter-bob — Phase 5: recruiter records Bob + procedural lesson +# make session-recruiter-charlie — Phase 6: recruiter uses checklist, records Charlie +# make session-crystallize — Phase 7: crystallize phone-screen pattern → Skill # ══════════════════════════════════════════════════════════════════════════════ SHELL := /bin/bash @@ -43,21 +52,78 @@ LOG_FILE := $(CURDIR)/.server.log PORT := 8765 BASE_URL := http://127.0.0.1:$(PORT) +# MCP config file for Claude Code agent sessions +MCP_CONFIG := $(CURDIR)/.demo.mcp.json + # Env for the demo binary DEMO_ENV := \ MEMORY_MCP_URL=$(BASE_URL)/mcp \ MEMORY_API_URL=$(BASE_URL)/api/resources \ MEMORY_JD_FILE=$(CURDIR)/data/job-description.txt -.PHONY: all demo build server-start server-stop server-wait server-logs status teardown +.PHONY: all demo build \ + server-start server-stop server-wait server-logs status \ + mcp-config \ + session-recruiter-alice session-hiring-manager \ + session-recruiter-bob session-recruiter-charlie \ + session-crystallize \ + teardown # ── all: one-shot full demo ─────────────────────────────────────────────────── all: build server-start server-wait demo server-stop -# ── demo: run scenario (server must be up) ──────────────────────────────────── -demo: $(DEMO_BIN) +# ── demo: run full scenario (server must be up) ─────────────────────────────── +# Runs setup (Phases 1-2) then all five Claude Code agent sessions (Phases 3-7) +demo: $(DEMO_BIN) mcp-config @echo "" $(DEMO_ENV) $(DEMO_BIN) + 
@$(MAKE) --no-print-directory session-recruiter-alice + @$(MAKE) --no-print-directory session-hiring-manager + @$(MAKE) --no-print-directory session-recruiter-bob + @$(MAKE) --no-print-directory session-recruiter-charlie + @$(MAKE) --no-print-directory session-crystallize + +# ── mcp-config: generate MCP config for Claude Code sessions ───────────────── +mcp-config: + @printf '{\n "mcpServers": {\n "toolhive-memory": {\n "type": "http",\n "url": "$(BASE_URL)/mcp"\n }\n }\n}\n' > $(MCP_CONFIG) + @echo "✓ MCP config written to $(MCP_CONFIG)" + +# ── agent sessions (Phase 3-7) ──────────────────────────────────────────────── + +session-recruiter-alice: mcp-config + @echo "" + @echo "═══════════════════════════════════════════════════════════════" + @echo " Phase 3 · Recruiter Session — Alice Chen phone screen" + @echo "═══════════════════════════════════════════════════════════════" + claude --print --mcp-config $(MCP_CONFIG) -p "$$(cat $(CURDIR)/prompts/recruiter-alice.txt)" + +session-hiring-manager: mcp-config + @echo "" + @echo "═══════════════════════════════════════════════════════════════" + @echo " Phase 4 · Hiring Manager — cold memory search" + @echo "═══════════════════════════════════════════════════════════════" + claude --print --mcp-config $(MCP_CONFIG) -p "$$(cat $(CURDIR)/prompts/hiring-manager.txt)" + +session-recruiter-bob: mcp-config + @echo "" + @echo "═══════════════════════════════════════════════════════════════" + @echo " Phase 5 · Recruiter Session — Bob Martinez + procedural lesson" + @echo "═══════════════════════════════════════════════════════════════" + claude --print --mcp-config $(MCP_CONFIG) -p "$$(cat $(CURDIR)/prompts/recruiter-bob.txt)" + +session-recruiter-charlie: mcp-config + @echo "" + @echo "═══════════════════════════════════════════════════════════════" + @echo " Phase 6 · Recruiter Session — Charlie Kim (HIRE)" + @echo "═══════════════════════════════════════════════════════════════" + claude --print --mcp-config 
$(MCP_CONFIG) -p "$$(cat $(CURDIR)/prompts/recruiter-charlie.txt)" + +session-crystallize: mcp-config + @echo "" + @echo "═══════════════════════════════════════════════════════════════" + @echo " Phase 7 · Crystallize — phone-screen pattern → Skill" + @echo "═══════════════════════════════════════════════════════════════" + claude --print --mcp-config $(MCP_CONFIG) -p "$$(cat $(CURDIR)/prompts/crystallize.txt)" # ── build: compile both binaries ───────────────────────────────────────────── build: $(SERVER_BIN) $(DEMO_BIN) @@ -128,5 +194,5 @@ status: # ── teardown: stop server + wipe all demo data ─────────────────────────────── teardown: server-stop @echo "▶ Removing demo data..." - @rm -f $(DB_FILE) $(DEMO_BIN) $(SERVER_BIN) $(LOG_FILE) $(CONFIG) + @rm -f $(DB_FILE) $(DEMO_BIN) $(SERVER_BIN) $(LOG_FILE) $(CONFIG) $(MCP_CONFIG) @echo "✓ Teardown complete — safe to run 'make all' again" diff --git a/demo/recruiter/cmd/demo/main.go b/demo/recruiter/cmd/demo/main.go index a8592c76d3..d8f4147ecd 100644 --- a/demo/recruiter/cmd/demo/main.go +++ b/demo/recruiter/cmd/demo/main.go @@ -1,11 +1,11 @@ // SPDX-FileCopyrightText: Copyright 2025 Stacklok, Inc. // SPDX-License-Identifier: Apache-2.0 -// Command demo runs the ToolHive Memory recruiter scenario. +// Command demo is the automated setup phase of the ToolHive Memory recruiter demo. // -// It exercises all four memory types (semantic, episodic, procedural, resource), -// demonstrates cross-session recall between a recruiter and a hiring manager, -// and finishes by crystallizing the learned interview pattern into a Skill scaffold. +// It handles Phase 1 (upload the job description as a static MCP Resource and +// print it in full) and Phase 2 (write shared semantic memories). Phases 3-7 +// are run as real Claude Code agent sessions — see the Makefile targets. 
// // Configuration via environment variables: // @@ -50,7 +50,6 @@ const ( ansiReset = "\033[0m" ansiBold = "\033[1m" ansiDim = "\033[2m" - ansiRed = "\033[31m" ansiGreen = "\033[32m" ansiYellow = "\033[33m" ansiPurple = "\033[35m" @@ -59,7 +58,7 @@ const ( ansiGray = "\033[90m" ) -func c(color, s string) string { return color + s + ansiReset } +func col(color, s string) string { return color + s + ansiReset } // ─── main ───────────────────────────────────────────────────────────────────── @@ -68,7 +67,7 @@ func main() { jd, err := os.ReadFile(jdFile) if err != nil { - fatalf("reading %s: %v\n Hint: run 'make demo' from demo/recruiter/", jdFile, err) + fatalf("reading %s: %v\n Hint: run from demo/recruiter/ directory", jdFile, err) } printBanner() @@ -76,80 +75,26 @@ func main() { // ── Phase 1 · Resource ──────────────────────────────────────────────────── phase(1, "Resources", "Upload the job description as a static MCP Resource (read-only to agents)") resID := uploadResource(ctx, jd) + printJobDescription(jd) pause() // ── Phase 2 · Semantic Memory ───────────────────────────────────────────── - phase(2, "Semantic Memory", "Company-wide facts — any agent session can recall these at any time") - shared := newSession(ctx, "shared") - defer shared.Close() + phase(2, "Semantic Memory", "Company-wide facts — written once, recalled by any agent session at any time") + cl := newSession(ctx, "setup") + defer cl.Close() - remember(ctx, shared, "semantic", + remember(ctx, cl, "semantic", "Company does not sponsor US work visas for any engineering role", "policy", "visa", "hiring") - remember(ctx, shared, "semantic", + remember(ctx, cl, "semantic", "Senior Go Engineer base salary band: $100,000–$150,000 USD; total comp includes equity", "compensation", "hiring", "senior-go-engineer") - remember(ctx, shared, "semantic", + remember(ctx, cl, "semantic", "Engineering team is fully remote, US timezone preferred (EST/PST). 
Async-first culture.", "remote", "culture", "hiring") pause() - // ── Phase 3 · Session 1 — Recruiter: Alice Chen (2026-04-24) ───────────── - phase(3, "Session 1 · Recruiter — Interview: Alice Chen", "2026-04-24") - recruiter := newSession(ctx, "recruiter") - defer recruiter.Close() - - remember(ctx, recruiter, "episodic", - "Interviewed Alice Chen on 2026-04-24 for Senior Go Engineer. "+ - "Strong distributed systems background (8 years Go, ex-Cloudflare). "+ - "Struggled under time pressure on the consensus algorithm question. "+ - "Technical screen: pass. Moved to final round with hiring manager.", - "alice-chen", "interview", "2026-04-24", "final-round") - remember(ctx, recruiter, "episodic", - "Alice Chen requires H1B visa sponsorship — ineligible per company policy. "+ - "Hiring manager loop should be cancelled to avoid wasting candidate and interviewer time.", - "alice-chen", "visa", "blocker", "2026-04-24") - pause() - - // ── Phase 4 · Session 2 — Hiring Manager: cold search ──────────────────── - phase(4, "Session 2 · Hiring Manager — Searching memory before the Alice call", - "Brand new session — no prior context loaded") - hm := newSession(ctx, "hiring-manager") - defer hm.Close() - - search(ctx, hm, "Alice Chen Senior Go Engineer interview") - search(ctx, hm, "visa sponsorship policy") - pause() - - // ── Phase 5 · Session 1 — Recruiter: Bob Martinez (2026-04-25) ─────────── - phase(5, "Session 1 · Recruiter — Interview: Bob Martinez", "2026-04-25") - remember(ctx, recruiter, "episodic", - "Interviewed Bob Martinez on 2026-04-25 for Senior Go Engineer. "+ - "Strong full-stack background but limited distributed systems experience. "+ - "Expects $160K base — above the $150K band ceiling. Not progressing.", - "bob-martinez", "interview", "2026-04-25") - proc1 := remember(ctx, recruiter, "procedural", - "Always clarify visa status and salary expectations within the first 15 minutes of "+ - "every phone screen. 
Two candidates in this cycle consumed significant recruiter "+ - "and hiring manager time before disqualifying on logistics.", - "phone-screen", "process", "hiring", "lesson-learned") - pause() - - // ── Phase 6 · Session 1 — Recruiter: Charlie Kim (2026-04-26) ──────────── - phase(6, "Session 1 · Recruiter — Interview: Charlie Kim", "2026-04-26 · HIRE") - remember(ctx, recruiter, "episodic", - "Interviewed Charlie Kim on 2026-04-26 for Senior Go Engineer. "+ - "US citizen, no sponsorship needed. 6 years Go, strong Kubernetes and controller-runtime experience. "+ - "Accepted $135K offer. RECOMMENDED FOR HIRE.", - "charlie-kim", "interview", "hire", "2026-04-26") - pause() - - // ── Phase 7 · Crystallize → Skill ───────────────────────────────────────── - phase(7, "Crystallize → Skill", "Promoting the phone-screen pattern to a reusable Skill scaffold") - crystallize(ctx, recruiter, "go-eng-phone-screen", proc1) - pause() - - printSummary(resID) + printHandoff(resID) } // ─── MCP helpers ────────────────────────────────────────────────────────────── @@ -171,7 +116,7 @@ func newSession(ctx context.Context, name string) *mcpclient.Client { }); err != nil { fatalf("initialize (%s): %v", name, err) } - fmt.Printf(" %s Session opened: %s%s\n", c(ansiGray, "→"), c(ansiBold+ansiCyan, name), ansiReset) + fmt.Printf(" %s Session opened: %s\n", col(ansiGray, "→"), col(ansiBold+ansiCyan, name)) return cl } @@ -197,7 +142,7 @@ func remember(ctx context.Context, cl *mcpclient.Client, memType, content string "author": "human", "tags": tags, }) - // RememberResult serialises as {"MemoryID":"...","Conflicts":null} (no json tags). 
+ // RememberResult serialises without json tags: {"MemoryID":"...","Conflicts":null} var resp struct { MemoryID string `json:"MemoryID"` Conflicts []any `json:"Conflicts"` @@ -207,74 +152,14 @@ func remember(ctx context.Context, cl *mcpclient.Client, memType, content string icon := typeIcon(memType) fmt.Printf("\n %s %s %s\n", icon, - c(ansiBold+typeColor(memType), "["+memType+"]"), + col(ansiBold+typeColor(memType), "["+memType+"]"), truncate(content, 72)) if resp.MemoryID != "" { - fmt.Printf(" %sid=%-28s tags=%v%s\n", ansiGray, resp.MemoryID, tags, ansiReset) + fmt.Printf(" %sid=%-36s tags=%v%s\n", ansiGray, resp.MemoryID, tags, ansiReset) } return resp.MemoryID } -func search(ctx context.Context, cl *mcpclient.Client, query string) { - fmt.Printf("\n %s %s\n", c(ansiYellow, "🔍"), c(ansiBold, "search: ")+c(ansiCyan, `"`+query+`"`)) - - raw := callTool(ctx, cl, "memory_search", map[string]any{ - "query": query, - "top_k": 3, - }) - - // ScoredEntry serialises as {"Entry":{...},"Similarity":0.xx} (no json tags). 
- var results []struct { - Entry struct { - ID string `json:"ID"` - Content string `json:"Content"` - Type string `json:"Type"` - } `json:"Entry"` - Similarity float64 `json:"Similarity"` - } - if err := json.Unmarshal([]byte(raw), &results); err != nil || len(results) == 0 { - fmt.Printf(" %sno results%s\n", ansiGray, ansiReset) - return - } - for _, r := range results { - fmt.Printf(" %s %s %s %s\n", - c(ansiGray, fmt.Sprintf("%.2f", r.Similarity)), - simBar(r.Similarity), - c(ansiDim+typeColor(r.Entry.Type), "["+r.Entry.Type+"]"), - truncate(r.Entry.Content, 62)) - } -} - -func crystallize(ctx context.Context, cl *mcpclient.Client, skillName string, ids ...string) { - raw := callTool(ctx, cl, "memory_crystallize", map[string]any{ - "ids": ids, - "name": skillName, - }) - var resp struct { - SkillName string `json:"skill_name"` - SkillMD string `json:"skill_md"` - Note string `json:"note"` - } - _ = json.Unmarshal([]byte(raw), &resp) - - fmt.Printf("\n %s Skill scaffold generated: %s\n", - c(ansiPurple, "💎"), - c(ansiBold+ansiCyan, resp.SkillName)) - fmt.Printf(" %s %s%s\n\n", ansiGray, resp.Note, ansiReset) - - divider := c(ansiDim, strings.Repeat("─", 62)) - fmt.Println(divider) - lines := strings.Split(resp.SkillMD, "\n") - limit := min(len(lines), 14) - for _, line := range lines[:limit] { - fmt.Printf(" %s%s%s\n", ansiGray, line, ansiReset) - } - if len(lines) > 14 { - fmt.Printf(" %s… (%d more lines)%s\n", ansiGray, len(lines)-14, ansiReset) - } - fmt.Println(divider) -} - // ─── Resources REST API helper ───────────────────────────────────────────────── func uploadResource(ctx context.Context, content []byte) string { @@ -286,7 +171,7 @@ func uploadResource(ctx context.Context, content []byte) string { req, err := http.NewRequestWithContext(ctx, http.MethodPost, apiURL, bytes.NewReader(body)) if err != nil { - fatalf("building resource request: %v", err) + fatalf("building request: %v", err) } req.Header.Set("Content-Type", "application/json") @@ -307,48 
+192,56 @@ func uploadResource(ctx context.Context, content []byte) string { } _ = json.NewDecoder(resp.Body).Decode(&r) - fmt.Printf("\n %s POST /api/resources ← Senior Go Engineer job description\n", c(ansiGray, "→")) - fmt.Printf(" %s Resource created: %s\n", c(ansiGreen, "✓"), c(ansiCyan, r.ID)) - fmt.Printf(" %s Agents discover it via memory_search or MCP resources/list%s\n", - c(ansiGreen, "✓"), ansiReset) + fmt.Printf("\n %s POST /api/resources ← Senior Go Engineer job description\n", col(ansiGray, "→")) + fmt.Printf(" %s Resource registered: %s\n", col(ansiGreen, "✓"), col(ansiCyan, r.ID)) + fmt.Printf(" %s Agents discover it via memory_search or MCP resources/list\n", col(ansiGreen, "✓")) return r.ID } +func printJobDescription(content []byte) { + divider := col(ansiDim, strings.Repeat("─", 64)) + fmt.Printf("\n%s\n", divider) + for _, line := range strings.Split(string(content), "\n") { + fmt.Printf(" %s%s%s\n", ansiGray, line, ansiReset) + } + fmt.Printf("%s\n", divider) +} + // ─── display helpers ───────────────────────────────────────────────────────── func printBanner() { bar := strings.Repeat("═", 64) - fmt.Printf("\n%s\n", c(ansiBold+ansiCyan, bar)) - fmt.Printf("%s\n", c(ansiBold+ansiCyan, " ToolHive Memory Demo — The Recruiter")) - fmt.Printf("%s\n", c(ansiCyan, " Scenario: Hiring a Senior Go Engineer at Stacklok")) - fmt.Printf("%s\n\n", c(ansiBold+ansiCyan, bar)) - fmt.Printf(" MCP endpoint : %s\n", c(ansiGray, mcpURL)) - fmt.Printf(" REST API : %s\n\n", c(ansiGray, apiURL)) + fmt.Printf("\n%s\n", col(ansiBold+ansiCyan, bar)) + fmt.Printf("%s\n", col(ansiBold+ansiCyan, " ToolHive Memory Demo — The Recruiter")) + fmt.Printf("%s\n", col(ansiCyan, " Scenario: Hiring a Senior Go Engineer at Stacklok")) + fmt.Printf("%s\n\n", col(ansiBold+ansiCyan, bar)) + fmt.Printf(" Server : %s\n\n", col(ansiGray, mcpURL)) } func phase(n int, title, subtitle string) { bar := strings.Repeat("─", 64) - fmt.Printf("\n%s\n", c(ansiYellow, bar)) - fmt.Printf(" %s\n", 
c(ansiBold+ansiWhite, fmt.Sprintf("Phase %d · %s", n, title))) + fmt.Printf("\n%s\n", col(ansiYellow, bar)) + fmt.Printf(" %s\n", col(ansiBold+ansiWhite, fmt.Sprintf("Phase %d · %s", n, title))) if subtitle != "" { fmt.Printf(" %s%s%s\n", ansiGray, subtitle, ansiReset) } - fmt.Printf("%s\n", c(ansiYellow, bar)) + fmt.Printf("%s\n", col(ansiYellow, bar)) } -func printSummary(resourceID string) { +func printHandoff(resourceID string) { bar := strings.Repeat("═", 64) - fmt.Printf("\n\n%s\n", c(ansiBold+ansiGreen, bar)) - fmt.Printf("%s\n", c(ansiBold+ansiGreen, " Demo complete!")) - fmt.Printf("%s\n\n", c(ansiBold+ansiGreen, bar)) - fmt.Printf(" %-22s %s\n", "Resource uploaded:", c(ansiCyan, resourceID)) - fmt.Printf(" %-22s %s\n", "Semantic memories:", "3") - fmt.Printf(" %-22s %s\n", "Episodic memories:", "4 (Alice, Alice-visa, Bob, Charlie)") - fmt.Printf(" %-22s %s\n", "Procedural:", "1 → crystallized to Skill") - fmt.Printf(" %-22s %s\n", "Sessions demoed:", "3 (shared, recruiter, hiring-manager)") - fmt.Println() - fmt.Printf(" %sTo repeat the demo:%s make teardown && make all\n\n", - ansiGray, ansiReset) + fmt.Printf("\n\n%s\n", col(ansiBold+ansiGreen, bar)) + fmt.Printf("%s\n", col(ansiBold+ansiGreen, " Setup complete — memory server is primed")) + fmt.Printf("%s\n\n", col(ansiBold+ansiGreen, bar)) + fmt.Printf(" Resource : %s\n", col(ansiCyan, resourceID)) + fmt.Printf(" Semantic : 3 company-wide facts written\n\n") + fmt.Printf(" %sNext: run the agent sessions to see Claude use the memory:%s\n\n", ansiBold, ansiReset) + fmt.Printf(" %smake session-recruiter-alice%s — recruiter records Alice Chen's interview\n", ansiCyan, ansiReset) + fmt.Printf(" %smake session-hiring-manager%s — hiring manager searches cold\n", ansiCyan, ansiReset) + fmt.Printf(" %smake session-recruiter-bob%s — recruiter records Bob + procedural lesson\n", ansiCyan, ansiReset) + fmt.Printf(" %smake session-recruiter-charlie%s — recruiter records Charlie (HIRE)\n", ansiCyan, ansiReset) + 
fmt.Printf(" %smake session-crystallize%s — crystallize phone-screen pattern → Skill\n\n", ansiCyan, ansiReset) + fmt.Printf(" %smake demo%s — run all sessions in sequence\n\n", ansiPurple, ansiReset) } func typeIcon(t string) string { @@ -377,25 +270,17 @@ func typeColor(t string) string { } } -func simBar(sim float64) string { - n := int(sim * 10) - n = min(n, 10) - return c(ansiGreen, strings.Repeat("█", n)+strings.Repeat("░", 10-n)) -} - func truncate(s string, n int) string { - s = strings.Join(strings.Fields(s), " ") // normalize whitespace + s = strings.Join(strings.Fields(s), " ") if len(s) <= n { return s } return s[:n-1] + "…" } -func pause() { - time.Sleep(200 * time.Millisecond) -} +func pause() { time.Sleep(200 * time.Millisecond) } func fatalf(format string, args ...any) { - fmt.Fprintf(os.Stderr, c(ansiRed, "ERROR: ")+format+"\n", args...) + fmt.Fprintf(os.Stderr, col(ansiGreen, "ERROR: ")+format+"\n", args...) os.Exit(1) } diff --git a/demo/recruiter/demo.tape b/demo/recruiter/demo.tape index dab96dc03b..ddc026bb6c 100644 --- a/demo/recruiter/demo.tape +++ b/demo/recruiter/demo.tape @@ -1,5 +1,6 @@ # ToolHive Memory Demo — The Recruiter -# Requires: vhs (brew install vhs), Ollama running, nomic-embed-text pulled +# Requires: vhs (brew install vhs), Ollama running, nomic-embed-text pulled, +# Claude Code CLI installed and authenticated (npm i -g @anthropic-ai/claude-code) # # Usage: # cd demo/recruiter @@ -7,8 +8,8 @@ Output demo.gif Set FontSize 14 -Set Width 140 -Set Height 46 +Set Width 160 +Set Height 50 Set Theme "Dracula" Set TypingSpeed 40ms Set PlaybackSpeed 1.0 @@ -43,51 +44,71 @@ Enter Sleep 15s # ── step 3: start server ────────────────────────────────────────────────────── -Type "make server-start" +Type "make server-start server-wait" Sleep 500ms Enter -Sleep 1s +Sleep 8s -Type "make server-wait" +# ── step 4: setup phase (resource upload + semantic memories) ───────────────── +Type "# Phase 1-2: Upload job description and prime shared 
memory" +Sleep 1s +Enter +Sleep 300ms +Type "make demo" Sleep 500ms Enter + +# Phase 1: Resource upload + print JD (fast — pure HTTP) Sleep 5s -# ── step 4: run demo ────────────────────────────────────────────────────────── -Type "make demo" +# Phase 2: Semantic memories (3 Ollama embedding calls, ~3s each) +Sleep 12s + +# ── step 5: recruiter session — Alice Chen ──────────────────────────────────── +Type "make session-recruiter-alice" Sleep 500ms Enter -# Phase 1: Resource upload (fast — pure HTTP) -Sleep 3s +# Claude Code: checks visa policy via memory_search, records 3 episodic memories +Sleep 30s -# Phase 2: Semantic memories (3 Ollama calls, ~3s each) -Sleep 12s +# ── step 6: hiring manager cold search ─────────────────────────────────────── +Type "make session-hiring-manager" +Sleep 500ms +Enter -# Phase 3: Recruiter session, Alice interviews (2 Ollama calls) -Sleep 8s +# Claude Code: 4 independent memory_search calls, reports pipeline state +Sleep 30s -# Phase 4: Hiring manager cold search (2 Ollama calls for query embed) -Sleep 8s +# ── step 7: recruiter session — Bob Martinez ───────────────────────────────── +Type "make session-recruiter-bob" +Sleep 500ms +Enter -# Phase 5: Bob + procedural memory (2 Ollama calls) -Sleep 8s +# Claude Code: checks pipeline, records episodic + procedural memory +Sleep 35s -# Phase 6: Charlie (1 Ollama call) -Sleep 5s +# ── step 8: recruiter session — Charlie Kim ─────────────────────────────────── +Type "make session-recruiter-charlie" +Sleep 500ms +Enter -# Phase 7: Crystallize (no embed needed) -Sleep 3s +# Claude Code: retrieves phone-screen checklist, records Charlie advancing +Sleep 30s -# Summary -Sleep 3s +# ── step 9: crystallize pattern into a Skill ────────────────────────────────── +Type "make session-crystallize" +Sleep 500ms +Enter -# ── step 5: teardown ────────────────────────────────────────────────────────── -Sleep 1s +# Claude Code: lists procedural memory, crystallizes → SKILL.md scaffold +Sleep 25s + 
+# ── step 10: teardown ──────────────────────────────────────────────────────── Type "make teardown" Sleep 500ms Enter -Sleep 2s +Sleep 3s # Final pause Sleep 2s diff --git a/demo/recruiter/prompts/crystallize.txt b/demo/recruiter/prompts/crystallize.txt new file mode 100644 index 0000000000..213a8297cf --- /dev/null +++ b/demo/recruiter/prompts/crystallize.txt @@ -0,0 +1,13 @@ +You are a senior recruiter at Stacklok doing a retrospective after the first week of phone screens for the Senior Go Engineer role. + +Step 1: Use memory_list with type=procedural to retrieve all procedural memories related to hiring. + +Step 2: Use memory_search to query "phone screen pattern lessons learned hiring" to find any related episodic observations. + +Step 3: Use memory_crystallize with the IDs of the procedural memories you found. Use name="senior-go-engineer-phone-screen-playbook". This will produce a SKILL.md scaffold — a reusable, versioned interview runbook. + +Step 4: Report the crystallize output verbatim so the team can review it as a candidate skill artifact. + +This demonstrates how fluid procedural knowledge (lessons learned mid-hiring-process) gets promoted into a structured, versioned runbook that any recruiter can follow in future hiring cycles. + +Be concise — just use the tools and show the output. diff --git a/demo/recruiter/prompts/hiring-manager.txt b/demo/recruiter/prompts/hiring-manager.txt new file mode 100644 index 0000000000..36d5ec3f17 --- /dev/null +++ b/demo/recruiter/prompts/hiring-manager.txt @@ -0,0 +1,12 @@ +You are the hiring manager for the Senior Go Engineer role at Stacklok. You are doing a cold check on the pipeline — you have not been involved in any recruiter sessions. + +Use memory_search to answer the following questions. Issue each search separately and report what you find: + +1. Search "candidates phone screen" — what candidates have been screened so far? +2. Search "visa sponsorship" — does the company sponsor work visas? +3. 
Search "salary compensation senior go engineer" — what is the approved compensation range? +4. Search "job description senior go engineer" — retrieve the job requirements. + +After all searches, write a brief summary: what do you know about the pipeline so far, and what salary range should offers stay within? + +Be concise and grounded in what the memory search returns — do not invent facts. diff --git a/demo/recruiter/prompts/recruiter-alice.txt b/demo/recruiter/prompts/recruiter-alice.txt new file mode 100644 index 0000000000..dfcf9af9f4 --- /dev/null +++ b/demo/recruiter/prompts/recruiter-alice.txt @@ -0,0 +1,14 @@ +You are a recruiter at Stacklok. You have just finished a phone screen with Alice Chen for the Senior Go Engineer role. + +Use the memory_remember tool to record the following observations from Alice's phone screen as EPISODIC memories (time-indexed events). Use author="human" and tags relevant to each fact. + +Facts to record: +1. Alice Chen: 8 years Go experience, strong distributed systems background. Currently at Google. Asking $160K base. Requires H1-B visa transfer — she is on OPT expiring in 6 months. +2. Alice phone screen completed 2024-03-10. Strong technical fit but visa situation is a blocker — company does not sponsor work visas. +3. Decision: Alice Chen archived — visa sponsorship required, company policy prohibits it. Candidate pool status: 1 archived. + +Before recording, use memory_search to check if there are any existing company policies about visa sponsorship that you should be aware of. Query: "visa sponsorship policy". + +After recording all three memories, use memory_list with type=episodic to confirm they were saved. + +Be concise — just use the tools and report what you stored. 
diff --git a/demo/recruiter/prompts/recruiter-bob.txt b/demo/recruiter/prompts/recruiter-bob.txt new file mode 100644 index 0000000000..1727982649 --- /dev/null +++ b/demo/recruiter/prompts/recruiter-bob.txt @@ -0,0 +1,15 @@ +You are a recruiter at Stacklok. You have just finished a phone screen with Bob Martinez for the Senior Go Engineer role. + +Before recording anything, use memory_search to check existing pipeline context: query "candidates phone screen pipeline". + +Use memory_remember to record the following as EPISODIC memories (author="human"): +1. Bob Martinez: 5 years Go, mostly microservices. US citizen, no visa issues. Asking $145K base — within band. Weak on distributed systems fundamentals; struggled explaining consensus algorithms. +2. Bob phone screen completed 2024-03-12. Technically below bar for senior level. Archived. +3. Pattern observed: two candidates archived in a row due to either visa issues or weak distributed systems knowledge. Phone screen question on consensus algorithms is a strong signal. + +Now record the following as a PROCEDURAL memory — a learned process from these screens (author="human", tags: ["hiring", "phone-screen", "process"]): +"Phone screen gate for Senior Go Engineer: (1) confirm visa/work-auth status in first 5 minutes — saves everyone's time if there is a blocker; (2) ask candidate to explain Raft or Paxos at a high level — weak answers here correlate strongly with underperformance in distributed systems work." + +After recording, use memory_list with type=procedural to confirm the procedure was saved. + +Be concise — just use the tools and report what you stored. diff --git a/demo/recruiter/prompts/recruiter-charlie.txt b/demo/recruiter/prompts/recruiter-charlie.txt new file mode 100644 index 0000000000..03eb83ef9c --- /dev/null +++ b/demo/recruiter/prompts/recruiter-charlie.txt @@ -0,0 +1,12 @@ +You are a recruiter at Stacklok. You are about to start a phone screen with Charlie Kim for the Senior Go Engineer role. 
+ +First, use memory_search to retrieve your phone screen checklist: query "phone screen gate process senior go engineer". Review the procedure. + +Now record the phone screen results as EPISODIC memories (author="human"): +1. Charlie Kim: 7 years Go, previously built distributed storage at AWS. US citizen. Asking $140K base — within band. Excellent on consensus algorithms (explained Raft clearly, discussed leader election edge cases). Strong communication skills. +2. Charlie phone screen completed 2024-03-15. Strong technical fit, compensation within band, no blockers. Advancing to technical interview loop. +3. Candidate pipeline update: Alice Chen archived (visa), Bob Martinez archived (below bar), Charlie Kim advancing to interview loop. Pipeline health: 1 active of 3 screened. + +After recording, use memory_search to query "advancing interview loop" to confirm Charlie's record is discoverable, then provide a brief pipeline status summary. + +Be concise — just use the tools and report what you stored. From 6fa82252a3977ebec1209bb26f98ccc816996698 Mon Sep 17 00:00:00 2001 From: Reynier Ortiz Vega Date: Sun, 26 Apr 2026 17:37:54 -0400 Subject: [PATCH 11/23] Rewrite demo prompts as natural recruiter chat MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Previous prompts told Claude which tools to call and in what order. They now read like real messages a recruiter would type — the agent discovers visa policy, logs outcomes, and crystallizes runbooks on its own by deciding when to reach for memory_search, memory_remember, and memory_crystallize. 
Co-Authored-By: Claude Sonnet 4.6 --- demo/recruiter/prompts/crystallize.txt | 14 +------------- demo/recruiter/prompts/hiring-manager.txt | 13 +------------ demo/recruiter/prompts/recruiter-alice.txt | 15 +++------------ demo/recruiter/prompts/recruiter-bob.txt | 16 +++------------- demo/recruiter/prompts/recruiter-charlie.txt | 13 ++++--------- 5 files changed, 12 insertions(+), 59 deletions(-) diff --git a/demo/recruiter/prompts/crystallize.txt b/demo/recruiter/prompts/crystallize.txt index 213a8297cf..57b4a5a285 100644 --- a/demo/recruiter/prompts/crystallize.txt +++ b/demo/recruiter/prompts/crystallize.txt @@ -1,13 +1 @@ -You are a senior recruiter at Stacklok doing a retrospective after the first week of phone screens for the Senior Go Engineer role. - -Step 1: Use memory_list with type=procedural to retrieve all procedural memories related to hiring. - -Step 2: Use memory_search to query "phone screen pattern lessons learned hiring" to find any related episodic observations. - -Step 3: Use memory_crystallize with the IDs of the procedural memories you found. Use name="senior-go-engineer-phone-screen-playbook". This will produce a SKILL.md scaffold — a reusable, versioned interview runbook. - -Step 4: Report the crystallize output verbatim so the team can review it as a candidate skill artifact. - -This demonstrates how fluid procedural knowledge (lessons learned mid-hiring-process) gets promoted into a structured, versioned runbook that any recruiter can follow in future hiring cycles. - -Be concise — just use the tools and show the output. +We've wrapped up the first week of screens for the Senior Go Engineer role. I want to turn what we learned into something the whole recruiting team can reuse — a proper runbook for future phone screens so we're not reinventing this every time. Can you put that together based on what we've figured out? 
diff --git a/demo/recruiter/prompts/hiring-manager.txt b/demo/recruiter/prompts/hiring-manager.txt index 36d5ec3f17..7a3ab9b116 100644 --- a/demo/recruiter/prompts/hiring-manager.txt +++ b/demo/recruiter/prompts/hiring-manager.txt @@ -1,12 +1 @@ -You are the hiring manager for the Senior Go Engineer role at Stacklok. You are doing a cold check on the pipeline — you have not been involved in any recruiter sessions. - -Use memory_search to answer the following questions. Issue each search separately and report what you find: - -1. Search "candidates phone screen" — what candidates have been screened so far? -2. Search "visa sponsorship" — does the company sponsor work visas? -3. Search "salary compensation senior go engineer" — what is the approved compensation range? -4. Search "job description senior go engineer" — retrieve the job requirements. - -After all searches, write a brief summary: what do you know about the pipeline so far, and what salary range should offers stay within? - -Be concise and grounded in what the memory search returns — do not invent facts. +Hey, I'm the hiring manager for the Senior Go Engineer opening. I haven't been in the loop on recruiting — can you catch me up? I'd like to know who's been screened so far, where they stand, what the approved comp range looks like, and a reminder of what we're actually hiring for. diff --git a/demo/recruiter/prompts/recruiter-alice.txt b/demo/recruiter/prompts/recruiter-alice.txt index dfcf9af9f4..685b431e37 100644 --- a/demo/recruiter/prompts/recruiter-alice.txt +++ b/demo/recruiter/prompts/recruiter-alice.txt @@ -1,14 +1,5 @@ -You are a recruiter at Stacklok. You have just finished a phone screen with Alice Chen for the Senior Go Engineer role. +I just finished a phone screen with Alice Chen for the Senior Go Engineer role. She has 8 years of Go experience, strong distributed systems background, currently at Google. Technically she looks great. Her ask is $160K base. 
-Use the memory_remember tool to record the following observations from Alice's phone screen as EPISODIC memories (time-indexed events). Use author="human" and tags relevant to each fact. +One issue: she mentioned she's on OPT and would need an H1-B transfer — her OPT expires in about 6 months. Before I move her forward I want to make sure that's not a blocker. Can you check if we have any policy on that? -Facts to record: -1. Alice Chen: 8 years Go experience, strong distributed systems background. Currently at Google. Asking $160K base. Requires H1-B visa transfer — she is on OPT expiring in 6 months. -2. Alice phone screen completed 2024-03-10. Strong technical fit but visa situation is a blocker — company does not sponsor work visas. -3. Decision: Alice Chen archived — visa sponsorship required, company policy prohibits it. Candidate pool status: 1 archived. - -Before recording, use memory_search to check if there are any existing company policies about visa sponsorship that you should be aware of. Query: "visa sponsorship policy". - -After recording all three memories, use memory_list with type=episodic to confirm they were saved. - -Be concise — just use the tools and report what you stored. +Also, once you've got that, can you log the outcome of this screen for me so the hiring manager and any other recruiter can see it? diff --git a/demo/recruiter/prompts/recruiter-bob.txt b/demo/recruiter/prompts/recruiter-bob.txt index 1727982649..73391bc1c4 100644 --- a/demo/recruiter/prompts/recruiter-bob.txt +++ b/demo/recruiter/prompts/recruiter-bob.txt @@ -1,15 +1,5 @@ -You are a recruiter at Stacklok. You have just finished a phone screen with Bob Martinez for the Senior Go Engineer role. +Just wrapped a screen with Bob Martinez. US citizen, no visa issues. 5 years Go, mostly microservices work. His ask is $145K which seems fine. Technically though he struggled — I asked him to walk me through how Raft works and he couldn't get through it. 
Felt like he was below bar for senior level. -Before recording anything, use memory_search to check existing pipeline context: query "candidates phone screen pipeline". +I'm going to archive him. Can you log that and update the pipeline? -Use memory_remember to record the following as EPISODIC memories (author="human"): -1. Bob Martinez: 5 years Go, mostly microservices. US citizen, no visa issues. Asking $145K base — within band. Weak on distributed systems fundamentals; struggled explaining consensus algorithms. -2. Bob phone screen completed 2024-03-12. Technically below bar for senior level. Archived. -3. Pattern observed: two candidates archived in a row due to either visa issues or weak distributed systems knowledge. Phone screen question on consensus algorithms is a strong signal. - -Now record the following as a PROCEDURAL memory — a learned process from these screens (author="human", tags: ["hiring", "phone-screen", "process"]): -"Phone screen gate for Senior Go Engineer: (1) confirm visa/work-auth status in first 5 minutes — saves everyone's time if there is a blocker; (2) ask candidate to explain Raft or Paxos at a high level — weak answers here correlate strongly with underperformance in distributed systems work." - -After recording, use memory_list with type=procedural to confirm the procedure was saved. - -Be concise — just use the tools and report what you stored. +Also, this is the second screen in a row where something obvious knocked the candidate out early — visa with Alice, distributed systems fundamentals with Bob. I feel like we could save everyone time if we checked those things right at the start of each call. Worth noting that pattern somewhere so I don't forget it. 
diff --git a/demo/recruiter/prompts/recruiter-charlie.txt b/demo/recruiter/prompts/recruiter-charlie.txt index 03eb83ef9c..4f362ae0d3 100644 --- a/demo/recruiter/prompts/recruiter-charlie.txt +++ b/demo/recruiter/prompts/recruiter-charlie.txt @@ -1,12 +1,7 @@ -You are a recruiter at Stacklok. You are about to start a phone screen with Charlie Kim for the Senior Go Engineer role. +About to jump on a screen with Charlie Kim. Before I start — do we have anything on how to run these calls? I remember we were going to standardize the approach after the last couple of screens didn't go well. -First, use memory_search to retrieve your phone screen checklist: query "phone screen gate process senior go engineer". Review the procedure. +--- -Now record the phone screen results as EPISODIC memories (author="human"): -1. Charlie Kim: 7 years Go, previously built distributed storage at AWS. US citizen. Asking $140K base — within band. Excellent on consensus algorithms (explained Raft clearly, discussed leader election edge cases). Strong communication skills. -2. Charlie phone screen completed 2024-03-15. Strong technical fit, compensation within band, no blockers. Advancing to technical interview loop. -3. Candidate pipeline update: Alice Chen archived (visa), Bob Martinez archived (below bar), Charlie Kim advancing to interview loop. Pipeline health: 1 active of 3 screened. +[30 minutes later] -After recording, use memory_search to query "advancing interview loop" to confirm Charlie's record is discoverable, then provide a brief pipeline status summary. - -Be concise — just use the tools and report what you stored. +That went really well. Charlie has 7 years of Go, spent time at AWS building distributed storage. US citizen. Asking $140K. He explained Raft clearly and even got into leader election edge cases without me prompting him. Great communicator too. I want to move him to the full interview loop. 
Can you record this and give me a quick status on where the pipeline stands overall? From 51054d5237c06eb9d7208e422e2b21d1770f9a02 Mon Sep 17 00:00:00 2001 From: Reynier Ortiz Vega Date: Tue, 28 Apr 2026 15:23:31 -0400 Subject: [PATCH 12/23] =?UTF-8?q?Make=20demo=20sessions=20interactive=20?= =?UTF-8?q?=E2=80=94=20print=20prompt=20and=20wait?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Instead of running claude --print automatically, each session target now prints the prompt to use and pauses until Enter is pressed. This lets you run the Claude Code session yourself (with the MCP config shown) before the demo advances to the next phase. Co-Authored-By: Claude Sonnet 4.6 --- demo/recruiter/Makefile | 41 ++++++++++++++++++----------------------- 1 file changed, 18 insertions(+), 23 deletions(-) diff --git a/demo/recruiter/Makefile b/demo/recruiter/Makefile index 7f79119e44..e723e5e69a 100644 --- a/demo/recruiter/Makefile +++ b/demo/recruiter/Makefile @@ -89,41 +89,36 @@ mcp-config: @echo "✓ MCP config written to $(MCP_CONFIG)" # ── agent sessions (Phase 3-7) ──────────────────────────────────────────────── +# Each session prints the prompt to use, then waits for you to run it in +# Claude Code (claude --mcp-config .demo.mcp.json) and press Enter to continue. -session-recruiter-alice: mcp-config +define print-prompt @echo "" @echo "═══════════════════════════════════════════════════════════════" - @echo " Phase 3 · Recruiter Session — Alice Chen phone screen" + @echo " $(1)" + @echo " MCP config: $(MCP_CONFIG)" @echo "═══════════════════════════════════════════════════════════════" - claude --print --mcp-config $(MCP_CONFIG) -p "$$(cat $(CURDIR)/prompts/recruiter-alice.txt)" + @echo "" + @cat $(2) + @echo "" + @echo "───────────────────────────────────────────────────────────────" + @read -p " ↑ Use this prompt in Claude Code, then press Enter to continue... 
" _ +endef + +session-recruiter-alice: mcp-config + $(call print-prompt,Phase 3 · Recruiter Session — Alice Chen phone screen,$(CURDIR)/prompts/recruiter-alice.txt) session-hiring-manager: mcp-config - @echo "" - @echo "═══════════════════════════════════════════════════════════════" - @echo " Phase 4 · Hiring Manager — cold memory search" - @echo "═══════════════════════════════════════════════════════════════" - claude --print --mcp-config $(MCP_CONFIG) -p "$$(cat $(CURDIR)/prompts/hiring-manager.txt)" + $(call print-prompt,Phase 4 · Hiring Manager — cold memory search,$(CURDIR)/prompts/hiring-manager.txt) session-recruiter-bob: mcp-config - @echo "" - @echo "═══════════════════════════════════════════════════════════════" - @echo " Phase 5 · Recruiter Session — Bob Martinez + procedural lesson" - @echo "═══════════════════════════════════════════════════════════════" - claude --print --mcp-config $(MCP_CONFIG) -p "$$(cat $(CURDIR)/prompts/recruiter-bob.txt)" + $(call print-prompt,Phase 5 · Recruiter Session — Bob Martinez + procedural lesson,$(CURDIR)/prompts/recruiter-bob.txt) session-recruiter-charlie: mcp-config - @echo "" - @echo "═══════════════════════════════════════════════════════════════" - @echo " Phase 6 · Recruiter Session — Charlie Kim (HIRE)" - @echo "═══════════════════════════════════════════════════════════════" - claude --print --mcp-config $(MCP_CONFIG) -p "$$(cat $(CURDIR)/prompts/recruiter-charlie.txt)" + $(call print-prompt,Phase 6 · Recruiter Session — Charlie Kim (HIRE),$(CURDIR)/prompts/recruiter-charlie.txt) session-crystallize: mcp-config - @echo "" - @echo "═══════════════════════════════════════════════════════════════" - @echo " Phase 7 · Crystallize — phone-screen pattern → Skill" - @echo "═══════════════════════════════════════════════════════════════" - claude --print --mcp-config $(MCP_CONFIG) -p "$$(cat $(CURDIR)/prompts/crystallize.txt)" + $(call print-prompt,Phase 7 · Crystallize — phone-screen pattern → 
Skill,$(CURDIR)/prompts/crystallize.txt) # ── build: compile both binaries ───────────────────────────────────────────── build: $(SERVER_BIN) $(DEMO_BIN) From c31dafc255baf57650fe2ed47ed077fb7926c68d Mon Sep 17 00:00:00 2001 From: Reynier Ortiz Vega Date: Tue, 28 Apr 2026 16:50:35 -0400 Subject: [PATCH 13/23] Clean up Claude-written local files between demo runs The crystallize session produced a phone-screen-runbook.md in data/, which on the next run Claude found on disk and short-circuited the memory server entirely. Teardown now deletes any .md files from data/ and .gitignore prevents them from being committed. Co-Authored-By: Claude Sonnet 4.6 --- demo/recruiter/Makefile | 1 + demo/recruiter/data/.gitignore | 2 ++ 2 files changed, 3 insertions(+) create mode 100644 demo/recruiter/data/.gitignore diff --git a/demo/recruiter/Makefile b/demo/recruiter/Makefile index e723e5e69a..322b675b19 100644 --- a/demo/recruiter/Makefile +++ b/demo/recruiter/Makefile @@ -190,4 +190,5 @@ status: teardown: server-stop @echo "▶ Removing demo data..." @rm -f $(DB_FILE) $(DEMO_BIN) $(SERVER_BIN) $(LOG_FILE) $(CONFIG) $(MCP_CONFIG) + @rm -f $(CURDIR)/data/*.md @echo "✓ Teardown complete — safe to run 'make all' again" diff --git a/demo/recruiter/data/.gitignore b/demo/recruiter/data/.gitignore new file mode 100644 index 0000000000..32b11de842 --- /dev/null +++ b/demo/recruiter/data/.gitignore @@ -0,0 +1,2 @@ +# Claude-generated runbooks and artifacts from demo sessions +*.md From ecab88fe1279783c49c2cd78698b771f8231ea85 Mon Sep 17 00:00:00 2001 From: Reynier Ortiz Vega Date: Tue, 28 Apr 2026 18:13:10 -0400 Subject: [PATCH 14/23] Add Reveal.js presentation for memory architecture demo MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit 15-slide deck covering the architecture (memory types, lifecycle, crystallization path) followed by a slide-by-slide walkthrough of the recruiter scenario. 
Self-contained HTML — open in browser and present fullscreen, no build step needed. Co-Authored-By: Claude Sonnet 4.6 --- demo/recruiter/slides.html | 760 +++++++++++++++++++++++++++++++++++++ 1 file changed, 760 insertions(+) create mode 100644 demo/recruiter/slides.html diff --git a/demo/recruiter/slides.html b/demo/recruiter/slides.html new file mode 100644 index 0000000000..5ac4f0f757 --- /dev/null +++ b/demo/recruiter/slides.html @@ -0,0 +1,760 @@ + + + + + +ToolHive Memory — Agentic Shared Memory + + + + + +
+
+ + +
+

ToolHive Memory

+

Agentic Shared Memory for Teams

+

+ A persistent, queryable memory layer that any Claude Code session
+ can read and write through a standard MCP interface. +

+
+ MCP + SQLite + sqlite-vec + Ollama embeddings + Go +
+
+ + +
+

The Problem

+

Every agent session starts with no memory of what came before.

+ + + + + + + + + + + Claude Code + Session A + + + Claude Code + Session B + + + + + + + + + + + + + ❌ Knowledge from Session A + invisible to Session B + + + ❌ Decisions made twice + no shared context, no continuity + + + no shared state + + +
+ A recruiter learns a visa policy the hard way. The next recruiter repeats the mistake. The hiring manager has no idea where the pipeline stands. +
+
+ + +
+

Architecture

+

A shared MCP server any agent session can talk to.

+ + + + + + + + + + + + + + Claude Code + Recruiter A + + + Claude Code + Hiring Manager + + + Claude Code + Recruiter B + + + + + + HTTP / MCP + + + + Memory Server + + memory_remember + memory_search + memory_crystallize + + resources / list + + + + + + + + + SQLite + sqlite-vec + Storage + Vectors + + + goose migrations + Schema Manager + + + nomic-embed-text + Ollama Embedder + +
+ + +
+

Memory Types

+

Four types cover everything from reference docs to learned processes.

+ +
+
+
📄
+
Resource
+
Read-only reference documents uploaded via REST API. Agents discover them through MCP resources/list or memory_search. Never modified by agents.
+
source: resource
+
+
+
🧠
+
Semantic
+
Aggregated facts and domain knowledge — things that are durably true. Conflict detection prevents silent contradictions on write.
+
author: human | agent
+
+
+
📅
+
Episodic
+
Time-indexed event records — things that happened. Phone screens, decisions, observations. Queryable by time range and tags.
+
e.g. "Alice Chen screened 2024-03-10"
+
+
+
🔧
+
Procedural
+
Learned behaviors and processes — how to do things. Emerges from episodic patterns. Can be crystallized into a versioned Skill runbook.
+
crystallizable → Skill
+
+
+
+ + +
+

Memory Lifecycle

+

Memory is managed — not just stored.

+ + + + + + + + + + + + + + + Remember + embed + conflict check + + + + Search + vector + trust-weighted + + + + Flag / Update + correct or mark stale + + + + Consolidate + merge related entries + + + + Crystallize + → Skill runbook + + + + + + + + + + + Background job every 24h: recomputes trust & staleness scores, expires TTL'd entries, surfaces consolidation candidates + + + +
+
+ Trust score — author weight × age decay × correction penalty × flag penalty +
+
+ Conflict detection — cosine similarity > 0.85 on write returns conflicts; agent decides +
+
+
+ + +
+

From Memory to Skill

+

Fluid procedural knowledge crystallizes into versioned, distributable runbooks.

+ + + + + + + + + + + + + + 🔧 Procedural memories + + + 🔧 Procedural memories + + + 🔧 Procedural memories + + + + + + + + memory_crystallize + drafts SKILL.md scaffold + human authors + pushes + + + + + + + Skill (OCI artifact) + versioned · immutable + distributable across teams + + + archived with crystallized_into pointer + + +
+ Procedural memories and Skills are the same knowledge at different stages — fluid and evolving in memory, crystallized and versioned as a Skill. +
+
+ + +
+
+ Live Demo +
+

The Recruiter

+

Hiring a Senior Go Engineer at Stacklok

+ +
+
+

Cast

+
+ 👩 Recruiter — runs phone screens
+ 🧑‍💼 Hiring Manager — checks pipeline cold
+ 🖥️ Memory Server — shared between all sessions +
+
+
+

What we'll see

+
+ ✅ Cross-session knowledge sharing
+ ✅ Policy recalled without being told
+ ✅ Process learned from failure
+ ✅ Runbook born from experience +
+
+
+
+ + +
+

Scenario Overview

+
    +
  • +
    1
    +
    + Resource  resource
    + Upload job description as a read-only MCP Resource — agents can discover it via memory_search +
    +
  • +
  • +
    2
    +
    + Semantic Memory  semantic
    + Prime 3 company-wide facts: no visa sponsorship, salary band $100–150K, remote US async culture +
    +
  • +
  • +
    3
    +
    + Recruiter — Alice Chen  episodic
    + Strong candidate, needs H1-B. Agent searches policy, finds the blocker, logs the outcome +
    +
  • +
  • +
    4
    +
    + Hiring Manager — cold search  semantic episodic
    + Joins cold. Searches pipeline, comp, JD — gets a full picture from memory alone +
    +
  • +
  • +
    5
    +
    + Recruiter — Bob Martinez  episodic procedural
    + Bob archived. Recruiter notices a pattern → writes a procedural memory for next screens +
    +
  • +
  • +
    6
    +
    + Recruiter — Charlie Kim  procedural episodic
    + Retrieves the checklist before the screen. Applies it. Charlie advances to the full loop. +
    +
  • +
  • +
    7
    +
    + Crystallize → Skill  procedural
    + One week of screens → crystallize → phone-screen runbook the whole team can reuse +
    +
  • +
+
+ + +
+
+
Phases 1 – 2
+
Setup — prime the memory server
+
+ +
+
+

Phase 1 · Resource

+
+ POST /api/resources

+ Job description uploaded as a read-only MCP Resource.
+ Agents discover it via memory_search or resources/list.
+ Cannot be modified or deleted by any agent. +
+
+
+

Phase 2 · Semantic Memory

+
+ 🧠  Company does not sponsor US work visas for any engineering role +
+
+ 🧠  Senior Go Engineer base: $100K–$150K + equity +
+
+ 🧠  Engineering team fully remote, US timezone, async-first +
+
+
+

Written once by the setup script — recalled by any agent session at any time.

+
+ + +
+
+
Phase 3
+
Recruiter Session — Alice Chen phone screen
+
+ +
+
+

The recruiter says

+
+ "She mentioned she's on OPT and would need an H1-B transfer. Before I move her forward, I want to make sure that's not a blocker. Can you check if we have any policy on that?" +
+
+
+

What the agent does

+
+
memory_search("visa sponsorship policy")
+
Finds: "Company does not sponsor US work visas"
+
memory_remember (episodic)
+
Alice Chen — OPT, needs H1-B → archived
+
+
+
+ +
+ The agent found a policy it was never told about in this session — it came from shared memory written in Phase 2. +
+
+ + +
+
+
Phase 4
+
Hiring Manager — cold search
+
+ +

+ "I haven't been in the loop on recruiting — can you catch me up? I'd like to know who's been screened, where they stand, the approved comp range, and a reminder of what we're hiring for." +

+ +
+
+
memory_search("candidates screened")
+
Finds Alice Chen → archived (visa). Pipeline: 1 of 1 archived.
+
+
+
memory_search("visa sponsorship")
+
Confirms no-sponsorship policy. Explains why Alice was archived.
+
+
+
memory_search("salary compensation")
+
$100K–$150K base + equity. Approved band retrieved.
+
+
+
memory_search("job description")
+
Retrieves the JD Resource. Full role requirements surfaced.
+
+
+

The hiring manager never spoke to the recruiter. The memory server was the handoff.

+
+ + +
+
+
Phase 5
+
Recruiter Session — Bob Martinez + a lesson learned
+
+ +
+
+
+ "…this is the second screen in a row where something obvious knocked the candidate out early. I feel like we could save everyone time if we checked those things right at the start of each call. Worth noting that pattern somewhere." +
+
+
+
+ 🔧 Procedural memory written

+ "Phone screen gate: (1) confirm work-auth in first 5 min, (2) ask candidate to explain Raft — weak answers correlate strongly with underperformance." +
+
+
+ +
+ The recruiter didn't say "write a procedural memory." The agent recognized it as a reusable process and chose the right memory type. +
+
+ + +
+
+
Phase 6
+
Recruiter Session — Charlie Kim
+
+ +
+
+

Before the screen

+
+ "About to jump on a screen with Charlie Kim. Do we have anything on how to run these calls?" +
+
+ → memory_search("phone screen process")
+ Retrieves the checklist from Phase 5 +
+
+
+

After the screen

+
+ ✅ US citizen — work-auth clear (first question) +
+
+ ✅ $140K ask — within the $100–150K band +
+
+ ✅ Explained Raft + leader election edge cases unprompted +
+

→ Advancing to interview loop

+
+
+ +
+ The checklist was written by a different agent session. This session retrieved and applied it. +
+
+ + +
+
+
Phase 7
+
Crystallize — phone-screen pattern → reusable Skill
+
+ +
+ "We've wrapped the first week of screens. I want to turn what we learned into something the whole recruiting team can reuse — a proper runbook for future phone screens." +
+ +
+
+
Agent retrieves
+
+ → memory_list(type=procedural)
+ → memory_search("phone screen patterns")
+ → memory_crystallize([ids…]) +
+
+
+
+ Output: SKILL.md scaffold
+ Knockout gates · Technical depth probe
+ Decision rubric · Post-call logging template

+ Human authors it → thv skills push → OCI artifact.
+ Procedural memories archived with crystallized_into pointer. +
+
+
+ +

One week of lived experience → a versioned, distributable runbook any recruiter can follow.

+
+ + +
+

What We Just Saw

+ +
    +
  • +
    📄
    +
    + Resources — reference docs agents discover through MCP; never modified by agents +
    +
  • +
  • +
    🧠
    +
    + Semantic memory — company-wide facts written once, recalled by any session +
    +
  • +
  • +
    📅
    +
    + Episodic memory — time-indexed events building a shared pipeline log +
    +
  • +
  • +
    🔧
    +
    + Procedural memory — process knowledge that emerged from failure, retrieved by a different session +
    +
  • +
  • +
    +
    + Crystallization — lived experience promoted into a versioned Skill runbook the whole team can use +
    +
  • +
+ +
+ Any Claude Code session. One MCP config file. Shared memory across the whole team. +
+
+ +
+
+ + + + + From e37b1dad3df40c9e19b523999eec37864a523cf6 Mon Sep 17 00:00:00 2001 From: Reynier Ortiz Vega Date: Tue, 28 Apr 2026 18:39:14 -0400 Subject: [PATCH 15/23] Expand slides: research, compare table, references, fix layout MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit - Add part dividers to structure narrative (Problem → Architecture → Demo) - Add "What Research Tells Us" slide with 3 sources - Add comparison table: LinkedIn CMA vs ToolHive Memory - Add References slide with full citations for all three sources - Fix memory types slide — replace 2x2 card grid with compact rows that no longer overflow the slide - Set center:false so slides don't jump vertically between content sizes Co-Authored-By: Claude Sonnet 4.6 --- demo/recruiter/slides.html | 876 ++++++++++++++++++++----------------- 1 file changed, 484 insertions(+), 392 deletions(-) diff --git a/demo/recruiter/slides.html b/demo/recruiter/slides.html index 5ac4f0f757..8efed57963 100644 --- a/demo/recruiter/slides.html +++ b/demo/recruiter/slides.html @@ -12,97 +12,119 @@ --green: #48bb78; --yellow: #f6e05e; --purple: #9f7aea; + --orange: #ed8936; --gray: #718096; --dim: #2d3748; } .reveal { font-family: 'Segoe UI', system-ui, sans-serif; } - /* headings */ - .reveal h1 { color: var(--cyan); font-size: 1.9em; margin-bottom: .3em; } - .reveal h2 { color: var(--cyan); font-size: 1.4em; margin-bottom: .4em; } - .reveal h3 { color: #e2e8f0; font-size: 1.1em; } - .reveal p, .reveal li { color: #cbd5e0; font-size: .88em; } + .reveal h1 { color: var(--cyan); font-size: 1.85em; margin-bottom: .25em; } + .reveal h2 { color: var(--cyan); font-size: 1.3em; margin-bottom: .35em; } + .reveal p, .reveal li { color: #cbd5e0; font-size: .86em; } - /* tag pill */ .tag { display: inline-block; - padding: 2px 10px; + padding: 2px 9px; border-radius: 9999px; - font-size: .68em; + font-size: .65em; font-weight: 600; letter-spacing: .04em; margin-right: 4px; } - .tag-cyan { 
background: rgba(0,212,255,.15); color: var(--cyan); border: 1px solid var(--cyan); } + .tag-cyan { background: rgba(0,212,255,.15); color: var(--cyan); border: 1px solid var(--cyan); } .tag-green { background: rgba(72,187,120,.15); color: var(--green); border: 1px solid var(--green); } .tag-yellow { background: rgba(246,224,94,.15); color: var(--yellow); border: 1px solid var(--yellow); } - .tag-purple { background: rgba(159,122,234,.15); color: var(--purple); border: 1px solid var(--purple); } - .tag-gray { background: rgba(113,128,150,.15); color: #a0aec0; border: 1px solid var(--gray); } + .tag-purple { background: rgba(159,122,234,.15);color: var(--purple); border: 1px solid var(--purple); } + .tag-gray { background: rgba(113,128,150,.15);color: #a0aec0; border: 1px solid var(--gray); } - /* memory type cards */ - .card-grid { display: grid; grid-template-columns: 1fr 1fr; gap: 16px; margin-top: 12px; } - .card { - background: rgba(255,255,255,.05); - border: 1px solid rgba(255,255,255,.1); - border-radius: 10px; - padding: 16px 18px; - text-align: left; + /* compact memory type rows */ + .type-row { + display: flex; align-items: flex-start; gap: 14px; + padding: 9px 12px; + border-radius: 8px; + margin-bottom: 7px; + background: rgba(255,255,255,.04); + border: 1px solid rgba(255,255,255,.08); } - .card .icon { font-size: 1.5em; } - .card .title { font-size: .85em; font-weight: 700; margin: 6px 0 4px; } - .card .desc { font-size: .72em; color: #718096; line-height: 1.4; } + .type-icon { font-size: 1.3em; min-width: 28px; } + .type-label { font-size: .8em; font-weight: 700; margin-bottom: 2px; } + .type-desc { font-size: .72em; color: #718096; line-height: 1.35; } + + /* two-col */ + .two-col { display: grid; grid-template-columns: 1fr 1fr; gap: 20px; align-items: start; } + + /* callout */ + .callout { + background: rgba(0,212,255,.06); + border-left: 3px solid var(--cyan); + border-radius: 0 7px 7px 0; + padding: 8px 14px; + margin: 7px 0; + font-size: 
.78em; + color: #e2e8f0; + line-height: 1.5; + } + .callout.green { background: rgba(72,187,120,.06); border-color: var(--green); } + .callout.yellow { background: rgba(246,224,94,.06); border-color: var(--yellow); } + .callout.purple { background: rgba(159,122,234,.06); border-color: var(--purple); } + .callout.orange { background: rgba(237,137,54,.06); border-color: var(--orange); } /* phase list */ .phase-list { list-style: none; padding: 0; margin: 0; } .phase-list li { - display: flex; align-items: flex-start; gap: 12px; - padding: 8px 0; border-bottom: 1px solid var(--dim); - font-size: .8em; + display: flex; align-items: flex-start; gap: 11px; + padding: 6px 0; border-bottom: 1px solid var(--dim); + font-size: .78em; } .phase-list li:last-child { border-bottom: none; } .phase-num { - min-width: 28px; height: 28px; border-radius: 50%; + min-width: 26px; height: 26px; border-radius: 50%; display: flex; align-items: center; justify-content: center; - font-size: .75em; font-weight: 700; + font-size: .72em; font-weight: 700; flex-shrink: 0; background: var(--dim); color: var(--cyan); border: 1px solid var(--cyan); } .phase-text strong { color: #e2e8f0; } .phase-text span { color: #718096; font-size: .92em; } - /* two-col layout */ - .two-col { display: grid; grid-template-columns: 1fr 1fr; gap: 24px; align-items: start; } - - /* highlight box */ - .callout { - background: rgba(0,212,255,.07); - border-left: 3px solid var(--cyan); - border-radius: 0 8px 8px 0; - padding: 10px 16px; - margin: 10px 0; - font-size: .8em; - color: #e2e8f0; - } - .callout.green { background: rgba(72,187,120,.07); border-color: var(--green); } - .callout.yellow { background: rgba(246,224,94,.07); border-color: var(--yellow); } - .callout.purple { background: rgba(159,122,234,.07); border-color: var(--purple); } - /* scenario header strip */ .scenario-header { - background: rgba(0,212,255,.08); + background: rgba(0,212,255,.07); border: 1px solid rgba(0,212,255,.2); - border-radius: 8px; 
- padding: 8px 16px; - display: flex; align-items: center; gap: 12px; - margin-bottom: 14px; + border-radius: 7px; + padding: 6px 14px; + display: flex; align-items: center; gap: 10px; + margin-bottom: 12px; } .scenario-header .phase-badge { - font-size: .7em; font-weight: 700; color: var(--cyan); - background: rgba(0,212,255,.15); border-radius: 6px; - padding: 3px 8px; white-space: nowrap; + font-size: .68em; font-weight: 700; color: var(--cyan); + background: rgba(0,212,255,.14); border-radius: 5px; + padding: 3px 7px; white-space: nowrap; + } + .scenario-header .phase-title { font-size: .82em; color: #e2e8f0; } + + /* ref card */ + .ref-card { + background: rgba(255,255,255,.04); + border: 1px solid rgba(255,255,255,.1); + border-radius: 8px; + padding: 12px 14px; + font-size: .74em; + line-height: 1.5; + } + .ref-card .ref-title { color: #e2e8f0; font-weight: 600; margin-bottom: 3px; } + .ref-card .ref-venue { color: var(--cyan); font-size: .88em; } + .ref-card .ref-note { color: #718096; font-size: .88em; margin-top: 4px; } + + /* section divider styling */ + .divider-slide { text-align: center; } + .divider-label { + display: inline-block; + font-size: .72em; font-weight: 700; letter-spacing: .12em; text-transform: uppercase; + color: var(--gray); border: 1px solid var(--dim); + border-radius: 6px; padding: 4px 14px; margin-bottom: .8em; } - .scenario-header .phase-title { font-size: .85em; color: #e2e8f0; } svg text { font-family: 'Segoe UI', system-ui, sans-serif; } @@ -111,17 +133,15 @@
- +
-

ToolHive Memory

-

Agentic Shared Memory for Teams

-

+

ToolHive Memory

+

Agentic Shared Memory for Teams

+

A persistent, queryable memory layer that any Claude Code session
- can read and write through a standard MCP interface. + can read and write — through a standard MCP interface.

-
+
MCP SQLite + sqlite-vec Ollama embeddings @@ -129,64 +149,156 @@

ToolHive Memory

- + +
+
Part 1
+

The Problem & the Research

+

+ Why agentic memory is hard, and what the research tells us to do about it. +

+
+ +

The Problem

-

Every agent session starts with no memory of what came before.

+

Every agent session starts with no memory of what came before.

- - + - - - Claude Code - Session A - - - Claude Code - Session B - - - - - - - - - - - - - ❌ Knowledge from Session A - invisible to Session B - - - ❌ Decisions made twice - no shared context, no continuity - - - no shared state + + Claude Code + Recruiter A + + + Claude Code + Hiring Manager + + + + + + + + + + ❌ Knowledge from Recruiter A + invisible to the hiring manager session + + + ❌ Decisions made twice + no shared context, no continuity + + no shared state -
- A recruiter learns a visa policy the hard way. The next recruiter repeats the mistake. The hiring manager has no idea where the pipeline stands. +
+ A recruiter learns a visa policy the hard way. The next session repeats the mistake. + The hiring manager has no idea where the pipeline stands. +
+
+ + +
+

What the Research Tells Us

+

Three bodies of work converge on the same failure modes.

+ +
+
+
A Survey on the Memory Mechanism of LLM-based Agents
+
arXiv 2404.13501
+
Most systems neglect the manage phase — consolidation, conflict resolution, and staleness tracking. Silent contradictions are the most common failure mode.
+
+
+
LinkedIn Cognitive Memory Agent (CMA)
+
LinkedIn Engineering Blog
+
Hierarchical memory with episodic + semantic + procedural types. Trust-weighted retrieval and per-application tenant isolation in production at LinkedIn scale.
+
+
+
Practical Guide to LLM Memory Systems
+
Towards Data Science
+
Trust differentiation between human-authored and agent-authored memories is widely neglected. Staleness is the second leading cause of retrieval degradation.
+
+
+ +
+
+ Key insight #1 — Memory isn't just storage. Write, retrieval, and management all need first-class design. +
+
+ Key insight #2 — Human-authored memories must outrank agent-authored ones. Agents can be wrong; humans correct. +
- + +
+

Our Approach vs. the Literature

+

Where we are ahead, and where we deliberately differ.

+ +
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
DimensionLinkedIn CMAToolHive Memory
Conflict detectionOn roadmap✅ Built — cosine sim > 0.85 on write
Trust / stalenessTime-based, on roadmap✅ Built — formula + 24h background job
User controlPlanned✅ list, update, flag, forget
Memory typesEpisodic + Semantic + ProceduralSemantic + Episodic + Procedural + Resource
RetrievalLLM-orchestrated multi-stepSingle-pass vector — agent IS the orchestrator
CrystallizationNot described✅ Procedural → versioned Skill (OCI)
+
+
+ + +
+
Part 2
+

Architecture

+

+ How it's built — components, memory types, and the full lifecycle. +

+
+ +

Architecture

-

A shared MCP server any agent session can talk to.

+

A shared MCP server — any agent session connects with one config file.

- + @@ -196,163 +308,156 @@

Architecture

- - - Claude Code - Recruiter A + + + Claude Code + Recruiter A + + + Claude Code + Hiring Manager - - Claude Code - Hiring Manager + + Claude Code + Recruiter B - - Claude Code - Recruiter B + + HTTP / MCP - - - - - HTTP / MCP + + + + - - Memory Server - - memory_remember - memory_search - memory_crystallize - + resources / list + + Memory Server + + memory_remember / search + memory_crystallize / flag + resources/list · api/resources + MCP Streamable HTTP - - - - - - - SQLite + sqlite-vec - Storage + Vectors - - - goose migrations - Schema Manager - - - nomic-embed-text - Ollama Embedder + + + + + + + SQLite + sqlite-vec + Storage + Vectors + + + goose migrations + Schema Manager + + + nomic-embed-text + Ollama Embedder
- +

Memory Types

-

Four types cover everything from reference docs to learned processes.

- -
-
-
📄
-
Resource
-
Read-only reference documents uploaded via REST API. Agents discover them through MCP resources/list or memory_search. Never modified by agents.
-
source: resource
+

Four types cover reference docs, facts, events, and learned processes.

+ +
+
+
📄
+
+
Resource
+
Read-only reference documents uploaded via REST API. Agents discover via resources/list or memory_search — never writable by agents. source: resource
+
-
-
🧠
-
Semantic
-
Aggregated facts and domain knowledge — things that are durably true. Conflict detection prevents silent contradictions on write.
-
author: human | agent
+
+
🧠
+
+
Semantic
+
Aggregated facts and domain knowledge — things that are durably true. Conflict detection (cosine sim > 0.85) prevents silent contradictions on write. human | agent
+
-
-
📅
-
Episodic
-
Time-indexed event records — things that happened. Phone screens, decisions, observations. Queryable by time range and tags.
-
e.g. "Alice Chen screened 2024-03-10"
+
+
📅
+
+
Episodic
+
Time-indexed event records — things that happened. Phone screens, decisions, observations. Queryable by tags and time range. e.g. "Alice Chen screened 2024-03-10"
+
-
-
🔧
-
Procedural
-
Learned behaviors and processes — how to do things. Emerges from episodic patterns. Can be crystallized into a versioned Skill runbook.
-
crystallizable → Skill
+
+
🔧
+
+
Procedural
+
Learned behaviors and processes. Emerges from episodic patterns. Can be crystallized into a versioned Skill (OCI artifact) the whole team can reuse. crystallizable → Skill
+
- +

Memory Lifecycle

-

Memory is managed — not just stored.

+

Memory is managed — not just stored.

- + - + - - - - Remember - embed + conflict check - - - - Search - vector + trust-weighted - - - - Flag / Update - correct or mark stale - - - - Consolidate - merge related entries - - - - Crystallize - → Skill runbook - - - - - - - - - - - Background job every 24h: recomputes trust & staleness scores, expires TTL'd entries, surfaces consolidation candidates + + Remember + embed + conflict check + + + Search + vector + trust-ranked + + + Flag / Update + correct or mark stale + + + Consolidate + merge related entries + + + Crystallize + → Skill runbook + + + + + + + + + Background job every 24h: recomputes trust & staleness scores · expires TTL'd entries · surfaces consolidation candidates (sim > 0.92) -
-
- Trust score — author weight × age decay × correction penalty × flag penalty +
+
+ Trust score = author weight × age decay × correction penalty × flag penalty.
+ Human-authored entries always outrank agent-authored ones.
-
- Conflict detection — cosine similarity > 0.85 on write returns conflicts; agent decides +
+ Conflict detection on write — cosine similarity > 0.85 returns matching entries. The agent (with context) decides: force-write, update, or abort.
- +

From Memory to Skill

-

Fluid procedural knowledge crystallizes into versioned, distributable runbooks.

+

Fluid procedural knowledge crystallizes into versioned, distributable runbooks.

- + @@ -362,136 +467,138 @@

From Memory to Skill

- - - 🔧 Procedural memories + + 🔧 Procedural memory - - 🔧 Procedural memories + + 🔧 Procedural memory - - 🔧 Procedural memories + + 🔧 Procedural memory - - - - + + + - - memory_crystallize - drafts SKILL.md scaffold - human authors + pushes + + memory_crystallize + drafts SKILL.md scaffold + human authors + reviews - - + + thv skills push - - - Skill (OCI artifact) - versioned · immutable - distributable across teams + + Skill (OCI artifact) + versioned · immutable + distributable across teams - - archived with crystallized_into pointer + archived with crystallized_into pointer -
- Procedural memories and Skills are the same knowledge at different stages — fluid and evolving in memory, crystallized and versioned as a Skill. +
+ Procedural memories and Skills are the same knowledge at different stages of maturity — + fluid and evolving in memory, crystallized and versioned as a Skill.
- + +
+
Part 3
+

Live Demo

+

+ The Recruiter — hiring a Senior Go Engineer at Stacklok +

+
+ +
-
- Live Demo -
-

The Recruiter

-

Hiring a Senior Go Engineer at Stacklok

+

The Recruiter Scenario

+

A one-week hiring process — every session shares a single memory server.

-
-
-

Cast

-
+
+
+

Cast

+
👩 Recruiter — runs phone screens
🧑‍💼 Hiring Manager — checks pipeline cold
- 🖥️ Memory Server — shared between all sessions + 🖥️ Memory Server — one server, all sessions
-
-

What we'll see

-
- ✅ Cross-session knowledge sharing
+
+

What we'll see

+
✅ Policy recalled without being told
- ✅ Process learned from failure
- ✅ Runbook born from experience + ✅ Cross-session knowledge sharing
+ ✅ Process learned from repeated failure
+ ✅ Runbook born from lived experience
+ +
+ claude --mcp-config .demo.mcp.json +  —  the only integration needed +
- +
-

Scenario Overview

+

Scenario — All Phases

  • 1
    - Resource  resource
    - Upload job description as a read-only MCP Resource — agents can discover it via memory_search + Resource upload  resource
    + Job description registered as a read-only MCP Resource — discoverable, never modifiable
  • 2
    - Semantic Memory  semantic
    - Prime 3 company-wide facts: no visa sponsorship, salary band $100–150K, remote US async culture + Semantic memory  semantic
    + 3 company-wide facts: no visa sponsorship · salary $100–150K · remote US async culture
  • 3
    - Recruiter — Alice Chen  episodic
    - Strong candidate, needs H1-B. Agent searches policy, finds the blocker, logs the outcome + Alice Chen  episodic
    + Strong candidate, needs H1-B. Agent searches policy, finds blocker, logs outcome
  • 4
    Hiring Manager — cold search  semantic episodic
    - Joins cold. Searches pipeline, comp, JD — gets a full picture from memory alone + Joins with zero context. Memory gives full pipeline status, comp band, and JD
  • 5
    - Recruiter — Bob Martinez  episodic procedural
    - Bob archived. Recruiter notices a pattern → writes a procedural memory for next screens + Bob Martinez  episodic procedural
    + Archived. Recruiter spots a pattern → agent writes a procedural memory unprompted
  • 6
    - Recruiter — Charlie Kim  procedural episodic
    - Retrieves the checklist before the screen. Applies it. Charlie advances to the full loop. + Charlie Kim  procedural episodic
    + Retrieves the checklist (written by a different session). Applies it. Charlie advances.
  • 7
    Crystallize → Skill  procedural
    - One week of screens → crystallize → phone-screen runbook the whole team can reuse + One week of screens → phone-screen runbook the whole recruiting team can reuse
- +
Phases 1 – 2
@@ -500,244 +607,228 @@

Scenario Overview

-

Phase 1 · Resource

-
+

Phase 1 · Resource

+
POST /api/resources

Job description uploaded as a read-only MCP Resource.
Agents discover it via memory_search or resources/list.
- Cannot be modified or deleted by any agent. + Protected by ErrReadOnly — no agent can modify it.
-

Phase 2 · Semantic Memory

-
+

Phase 2 · Semantic memory

+
🧠  Company does not sponsor US work visas for any engineering role
-
+
🧠  Senior Go Engineer base: $100K–$150K + equity
-
+
🧠  Engineering team fully remote, US timezone, async-first
-

Written once by the setup script — recalled by any agent session at any time.

+

Written once by the setup script — recalled by any agent session at any time.

- +
Phase 3
-
Recruiter Session — Alice Chen phone screen
+
Recruiter — Alice Chen phone screen
-

The recruiter says

-
- "She mentioned she's on OPT and would need an H1-B transfer. Before I move her forward, I want to make sure that's not a blocker. Can you check if we have any policy on that?" +

The recruiter says

+
+ "She mentioned she's on OPT and would need an H1-B transfer. Before I move her forward I want to make sure that's not a blocker. Can you check if we have any policy on that?"
-

What the agent does

-
+

What the agent does

+
memory_search("visa sponsorship policy")
-
Finds: "Company does not sponsor US work visas"
+
Finds: "Company does not sponsor US work visas"
memory_remember (episodic)
-
Alice Chen — OPT, needs H1-B → archived
+
Alice Chen — OPT / H1-B needed → archived
-
- The agent found a policy it was never told about in this session — it came from shared memory written in Phase 2. +
+ The agent found a policy it was never told about in this session — + retrieved from shared memory written in Phase 2.
- +
Phase 4
-
Hiring Manager — cold search
+
Hiring Manager — cold pipeline review
-

- "I haven't been in the loop on recruiting — can you catch me up? I'd like to know who's been screened, where they stand, the approved comp range, and a reminder of what we're hiring for." +

+ "I haven't been in the loop on recruiting — can you catch me up? Pipeline status, approved comp range, and a reminder of what we're hiring for."

-
-
-
memory_search("candidates screened")
-
Finds Alice Chen → archived (visa). Pipeline: 1 of 1 archived.
-
-
-
memory_search("visa sponsorship")
-
Confirms no-sponsorship policy. Explains why Alice was archived.
-
-
-
memory_search("salary compensation")
-
$100K–$150K base + equity. Approved band retrieved.
-
-
-
memory_search("job description")
-
Retrieves the JD Resource. Full role requirements surfaced.
-
+
+
memory_search("candidates screened")
Alice Chen → archived (visa). 1 of 1.
+
memory_search("visa sponsorship")
No sponsorship policy. Explains Alice.
+
memory_search("salary compensation")
$100K–$150K base + equity. Approved band.
+
memory_search("job description")
Retrieves the JD Resource. Full requirements.
-

The hiring manager never spoke to the recruiter. The memory server was the handoff.

+ +

The hiring manager never spoke to the recruiter. The memory server was the handoff.

- +
Phase 5
-
Recruiter Session — Bob Martinez + a lesson learned
+
Recruiter — Bob Martinez + a lesson learned
-
+
"…this is the second screen in a row where something obvious knocked the candidate out early. I feel like we could save everyone time if we checked those things right at the start of each call. Worth noting that pattern somewhere."
-
+
🔧 Procedural memory written

- "Phone screen gate: (1) confirm work-auth in first 5 min, (2) ask candidate to explain Raft — weak answers correlate strongly with underperformance." + "Phone screen gate: (1) confirm work-auth in first 5 min, (2) ask candidate to explain Raft — weak answers correlate with underperformance on distributed systems work."
-
- The recruiter didn't say "write a procedural memory." The agent recognized it as a reusable process and chose the right memory type. +
+ The recruiter said "worth noting." The agent recognised it as a reusable process and chose the right memory type without being asked.
- +
Phase 6
-
Recruiter Session — Charlie Kim
+
Recruiter — Charlie Kim (HIRE)
-

Before the screen

-
+

Before the screen

+
"About to jump on a screen with Charlie Kim. Do we have anything on how to run these calls?"
-
+
memory_search("phone screen process")
- Retrieves the checklist from Phase 5 + Retrieves the gate checklist from Phase 5
-

After the screen

-
- ✅ US citizen — work-auth clear (first question) -
-
- ✅ $140K ask — within the $100–150K band -
-
- ✅ Explained Raft + leader election edge cases unprompted -
-

→ Advancing to interview loop

+

Post-screen results

+
✅ US citizen — work-auth clear (first question)
+
✅ $140K ask — within $100–150K band
+
✅ Explained Raft + leader election edge cases unprompted
+

→ Advancing to interview loop

-
- The checklist was written by a different agent session. This session retrieved and applied it. +
+ The checklist was written by a different agent session. This session retrieved and applied it cold.
- +
Phase 7
-
Crystallize — phone-screen pattern → reusable Skill
+
Crystallize — one week of screens → a reusable Skill
-
+
"We've wrapped the first week of screens. I want to turn what we learned into something the whole recruiting team can reuse — a proper runbook for future phone screens."
-
-
Agent retrieves
-
+
+
Agent retrieves & crystallizes
+
memory_list(type=procedural)
memory_search("phone screen patterns")
- → memory_crystallize([ids…]) + → memory_crystallize([ids…], name="...")
-
+
Output: SKILL.md scaffold
Knockout gates · Technical depth probe
Decision rubric · Post-call logging template

- Human authors it → thv skills push → OCI artifact.
- Procedural memories archived with crystallized_into pointer. + Human reviews → thv skills push → OCI artifact.
+ Originals archived with crystallized_into pointer.
-

One week of lived experience → a versioned, distributable runbook any recruiter can follow.

+

One week of lived experience → a versioned runbook any recruiter can follow from day one.

- +

What We Just Saw

-
    +
    • 📄
      -
      - Resources — reference docs agents discover through MCP; never modified by agents -
      +
      Resource — reference docs agents discover through MCP; protected from modification
    • 🧠
      -
      - Semantic memory — company-wide facts written once, recalled by any session -
      +
      Semantic — company-wide facts written once, recalled by any session with no explicit handoff
    • 📅
      -
      - Episodic memory — time-indexed events building a shared pipeline log -
      +
      Episodic — time-indexed events building a shared pipeline log across recruiter sessions
    • 🔧
      -
      - Procedural memory — process knowledge that emerged from failure, retrieved by a different session -
      +
      Procedural — process knowledge that emerged from failure; retrieved by a session that never wrote it
    • -
      - Crystallization — lived experience promoted into a versioned Skill runbook the whole team can use -
      +
      Crystallization — lived team experience promoted into a versioned Skill the whole org can distribute
    -
    +
    Any Claude Code session. One MCP config file. Shared memory across the whole team.
+ +
+

References

+
+
+
A Survey on the Memory Mechanism of LLM-based Agents
+
arXiv:2603.07670 · 2025
+
Taxonomy of memory types (sensory, short-term, long-term), memory operations lifecycle (acquire, manage, utilize), and analysis of failure modes. The "manage" phase — consolidation, conflict resolution, staleness — is the most neglected in practice.
+
+
+
The LinkedIn Generative AI Application Tech Stack: Personalization with Cognitive Memory Agent
+
LinkedIn Engineering Blog · 2024
+
Production deployment of hierarchical episodic + aggregated semantic + procedural memory at LinkedIn scale. Trust-weighted retrieval, per-application isolation. Informed our comparison table and the decision to prioritise conflict detection and user control.
+
+
+
A Practical Guide to Implementing Memory in LLM Applications
+
Towards Data Science · 2024
+
Practitioner analysis of memory degradation causes: staleness and trust neglect are the top two. Recommends human-authored memory to outrank agent-authored, and explicit staleness scoring — both implemented here.
+
+
+
+
@@ -753,7 +844,8 @@

What We Just Saw

backgroundTransition: 'none', width: 1100, height: 680, - margin: 0.06, + margin: 0.05, + center: false, }); From e96b36865d4a3e546942956ea829b15e819d43b8 Mon Sep 17 00:00:00 2001 From: Reynier Ortiz Vega Date: Wed, 29 Apr 2026 08:52:55 -0400 Subject: [PATCH 16/23] =?UTF-8?q?Fix=20slide=20overflow=20=E2=80=94=20cont?= =?UTF-8?q?ent=20no=20longer=20exceeds=20viewport?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit - Increase logical height 680→750 and tighten margin 0.05→0.04 to give dense slides more breathing room - Shrink ref-card padding/font and comparison table row padding so Research and References slides fit without clipping - Reduce h2 and phase-list padding to reclaim vertical space - Add tenant-isolation row to comparison table for completeness Co-Authored-By: Claude Sonnet 4.6 --- demo/recruiter/slides.html | 119 ++++++++++++++++++++----------------- 1 file changed, 64 insertions(+), 55 deletions(-) diff --git a/demo/recruiter/slides.html b/demo/recruiter/slides.html index 8efed57963..a916fb0d56 100644 --- a/demo/recruiter/slides.html +++ b/demo/recruiter/slides.html @@ -19,8 +19,8 @@ .reveal { font-family: 'Segoe UI', system-ui, sans-serif; } - .reveal h1 { color: var(--cyan); font-size: 1.85em; margin-bottom: .25em; } - .reveal h2 { color: var(--cyan); font-size: 1.3em; margin-bottom: .35em; } + .reveal h1 { color: var(--cyan); font-size: 1.85em; margin-bottom: .2em; } + .reveal h2 { color: var(--cyan); font-size: 1.25em; margin-bottom: .25em; } .reveal p, .reveal li { color: #cbd5e0; font-size: .86em; } .tag { @@ -73,9 +73,9 @@ /* phase list */ .phase-list { list-style: none; padding: 0; margin: 0; } .phase-list li { - display: flex; align-items: flex-start; gap: 11px; - padding: 6px 0; border-bottom: 1px solid var(--dim); - font-size: .78em; + display: flex; align-items: flex-start; gap: 10px; + padding: 5px 0; border-bottom: 1px solid var(--dim); + font-size: .77em; } .phase-list li:last-child { 
border-bottom: none; } .phase-num { @@ -109,13 +109,13 @@ background: rgba(255,255,255,.04); border: 1px solid rgba(255,255,255,.1); border-radius: 8px; - padding: 12px 14px; - font-size: .74em; - line-height: 1.5; + padding: 9px 12px; + font-size: .73em; + line-height: 1.45; } - .ref-card .ref-title { color: #e2e8f0; font-weight: 600; margin-bottom: 3px; } - .ref-card .ref-venue { color: var(--cyan); font-size: .88em; } - .ref-card .ref-note { color: #718096; font-size: .88em; margin-top: 4px; } + .ref-card .ref-title { color: #e2e8f0; font-weight: 600; margin-bottom: 2px; } + .ref-card .ref-venue { color: var(--cyan); font-size: .87em; } + .ref-card .ref-note { color: #718096; font-size: .87em; margin-top: 3px; } /* section divider styling */ .divider-slide { text-align: center; } @@ -204,32 +204,32 @@

The Problem

What the Research Tells Us

-

Three bodies of work converge on the same failure modes.

+

Three bodies of work converge on the same failure modes.

-
+
A Survey on the Memory Mechanism of LLM-based Agents
-
arXiv 2603.07670
-
Most systems neglect the manage phase — consolidation, conflict resolution, and staleness tracking. Silent contradictions are the most common failure mode.
+
arXiv 2603.07670 · 2025
+
Most systems neglect the manage phase — consolidation, conflict resolution, staleness. Silent contradictions are the most common failure mode.
LinkedIn Cognitive Memory Agent (CMA)
-
LinkedIn Engineering Blog
-
Hierarchical memory with episodic + semantic + procedural types. Trust-weighted retrieval and per-application tenant isolation in production at LinkedIn scale.
+
LinkedIn Engineering Blog · 2024
+
Hierarchical episodic + semantic + procedural memory at LinkedIn scale. Trust-weighted retrieval and per-application tenant isolation in production.
Practical Guide to LLM Memory Systems
-
Towards Data Science
-
Trust differentiation between human-authored and agent-authored memories is widely neglected. Staleness is the second leading cause of retrieval degradation.
+
Towards Data Science · 2024
+
Trust differentiation between human and agent memory is widely neglected. Staleness is the second leading cause of retrieval degradation.
-
- Key insight #1 — Memory isn't just storage. Write, retrieval, and management all need first-class design. +
+ Key insight #1 — Memory isn't just storage. Write, retrieval, and management (consolidation, conflict, staleness) all need first-class design.
-
- Key insight #2 — Human-authored memories must outrank agent-authored ones. Agents can be wrong; humans correct. +
+ Key insight #2 — Human-authored memories must outrank agent-authored ones. Trust differentiation is the most neglected dimension in practice.
@@ -237,51 +237,60 @@

What the Research Tells Us

Our Approach vs. the Literature

-

Where we are ahead, and where we deliberately differ.

-
+
- - - - + + + + - - - + + + - - - + + + - - - + + + - - - + + + - - - + + + + + + + + - - - + + +
DimensionLinkedIn CMAToolHive Memory
DimensionLinkedIn CMAToolHive Memory
Conflict detectionOn roadmap✅ Built — cosine sim > 0.85 on writeConflict detectionOn roadmap✅ Built — cosine sim > 0.85 on write
Trust / stalenessTime-based, on roadmap✅ Built — formula + 24h background jobTrust / stalenessTime-based, on roadmap✅ Built — formula + 24 h background job
User controlPlanned✅ list, update, flag, forgetUser controlPlanned✅ list · update · flag · forget
Memory typesEpisodic + Semantic + ProceduralSemantic + Episodic + Procedural + ResourceMemory typesEpisodic + Semantic + Procedural+ Resource (read-only reference docs)
RetrievalLLM-orchestrated multi-stepSingle-pass vector — agent IS the orchestratorRetrievalLLM-orchestrated multi-stepSingle-pass vector — agent is the orchestrator
CrystallizationNot described✅ Procedural → versioned Skill (OCI)
CrystallizationNot described✅ Procedural → versioned Skill (OCI)Tenant isolationPer-application storage isolationAuth at proxy level — storage isolation on roadmap
+ +
+ We are ahead on conflict detection, trust scoring, and user control. + LinkedIn is ahead on hierarchical aggregation and tenant isolation — both planned for a later phase. +
@@ -810,21 +819,21 @@

What We Just Saw

References

-
-
+
+
A Survey on the Memory Mechanism of LLM-based Agents
arXiv:2603.07670 · 2025
-
Taxonomy of memory types (sensory, short-term, long-term), memory operations lifecycle (acquire, manage, utilize), and analysis of failure modes. The "manage" phase — consolidation, conflict resolution, staleness — is the most neglected in practice.
+
Taxonomy of memory types and operations lifecycle (acquire, manage, utilize). The "manage" phase — consolidation, conflict resolution, staleness — is the most neglected in practice. Informed our lifecycle design and the 24 h background job.
The LinkedIn Generative AI Application Tech Stack: Personalization with Cognitive Memory Agent
LinkedIn Engineering Blog · 2024
-
Production deployment of hierarchical episodic + aggregated semantic + procedural memory at LinkedIn scale. Trust-weighted retrieval, per-application isolation. Informed our comparison table and the decision to prioritise conflict detection and user control.
+
Production deployment of hierarchical episodic + aggregated semantic + procedural memory at LinkedIn scale. Trust-weighted retrieval and per-application isolation. Informed our comparison table and the prioritisation of conflict detection and user control.
-
+
A Practical Guide to Implementing Memory in LLM Applications
Towards Data Science · 2024
-
Practitioner analysis of memory degradation causes: staleness and trust neglect are the top two. Recommends human-authored memory to outrank agent-authored, and explicit staleness scoring — both implemented here.
+
Practitioner analysis of memory degradation: staleness and trust neglect are the top two causes. Recommends human-authored memory outranking agent-authored, and explicit staleness scoring — both implemented here.
@@ -843,8 +852,8 @@

References

transitionSpeed: 'fast', backgroundTransition: 'none', width: 1100, - height: 680, - margin: 0.05, + height: 750, + margin: 0.04, center: false, }); From 4189ec05f3e191cbbc7fbe49930952faa3c1cc73 Mon Sep 17 00:00:00 2001 From: Reynier Ortiz Vega Date: Wed, 29 Apr 2026 09:05:23 -0400 Subject: [PATCH 17/23] Enable per-slide scrolling in Reveal.js presentation MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Reveal sets height:auto on section elements, so overflow-y:auto had nothing to overflow against — the slides container clipped instead. Fix: pin each section to the configured height (750px) via a ready event handler, then let overflow-y:auto do its job. Adds a subtle dark-themed scrollbar so it's unobtrusive during presentation. Co-Authored-By: Claude Sonnet 4.6 --- demo/recruiter/slides.html | 24 ++++++++++++++++++++++++ 1 file changed, 24 insertions(+) diff --git a/demo/recruiter/slides.html b/demo/recruiter/slides.html index a916fb0d56..ff6b2f519d 100644 --- a/demo/recruiter/slides.html +++ b/demo/recruiter/slides.html @@ -127,6 +127,20 @@ } svg text { font-family: 'Segoe UI', system-ui, sans-serif; } + + /* Allow individual slides to scroll when content exceeds the slide height. + Reveal sets height:auto on sections; the JS below pins them to the + configured height so overflow-y:auto actually triggers. */ + .reveal .slides > section { + box-sizing: border-box; + overflow-y: auto; + /* custom scrollbar — subtle, dark-themed */ + scrollbar-width: thin; + scrollbar-color: #4a5568 transparent; + } + .reveal .slides > section::-webkit-scrollbar { width: 5px; } + .reveal .slides > section::-webkit-scrollbar-track { background: transparent; } + .reveal .slides > section::-webkit-scrollbar-thumb { background: #4a5568; border-radius: 3px; } @@ -856,6 +870,16 @@

References

margin: 0.04, center: false, }); + + // Pin each slide to the configured height so overflow-y:auto triggers. + // Reveal sets height:auto on
elements; without a fixed height the + // overflow property has nothing to overflow against and clipping wins. + Reveal.on('ready', () => { + const h = Reveal.getConfig().height; + document.querySelectorAll('.reveal .slides > section').forEach(el => { + el.style.height = h + 'px'; + }); + }); From 0ba0935b03bbf0db3e09643cfc8b43fbffa313ee Mon Sep 17 00:00:00 2001 From: Reynier Ortiz Vega Date: Wed, 29 Apr 2026 09:15:06 -0400 Subject: [PATCH 18/23] Improve architecture slide: pluggable backends + clearer MCP box MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit - Replace the three single-technology backend boxes with three labeled backend groups (Storage, Vector Store, Embedder), each showing the default option and all supported alternatives - Remove 'goose migrations / Schema Manager' box — internal implementation detail with no meaning to an audience - Memory Server box now shows the MCP transport badge and lists tools with a brief description of each (memory_remember, memory_search, memory_crystallize, resources/list) Co-Authored-By: Claude Sonnet 4.6 --- demo/recruiter/slides.html | 106 +++++++++++++++++++++++-------------- 1 file changed, 65 insertions(+), 41 deletions(-) diff --git a/demo/recruiter/slides.html b/demo/recruiter/slides.html index ff6b2f519d..7010c20ef9 100644 --- a/demo/recruiter/slides.html +++ b/demo/recruiter/slides.html @@ -319,9 +319,9 @@

Architecture

Architecture

-

A shared MCP server — any agent session connects with one config file.

+

A shared MCP server with fully pluggable storage, vector, and embedder backends.

- + @@ -332,52 +332,76 @@

Architecture

- - Claude Code - Recruiter A + + Claude Code + Recruiter A - - Claude Code - Hiring Manager + + Claude Code + Hiring Manager - - Claude Code - Recruiter B + + Claude Code + Recruiter B - - HTTP / MCP + HTTP / MCP - - - + + + - - Memory Server - - memory_remember / search - memory_crystallize / flag - resources/list · api/resources - MCP Streamable HTTP - - - - - - - - - SQLite + sqlite-vec - Storage + Vectors - - - goose migrations - Schema Manager - - - nomic-embed-text - Ollama Embedder + + + Memory Server + + MCP · STREAMABLE HTTP + + MCP TOOLS + + + memory_remember + store + conflict check + memory_search + vector similarity query + memory_crystallize + → Skill scaffold + resources/list · flag · forget + + + + + + + + + 💾 Storage + + + default + + SQLite + sqlite-vec + also: PostgreSQL + pgvector · Qdrant · Weaviate · Pinecone + swap provider in memory-server.yaml — no code changes + + + + 🔍 Vector Store + + default + sqlite-vec (embedded, zero infra) + also: Qdrant · pgvector · Weaviate · Pinecone + PostgreSQL + pgvector collapses storage + vector into one + + + + 🔤 Embedder + + default + Ollama (local, nomic-embed-text) + also: OpenAI · Cohere · Google Vertex AI + teams with no local GPU use OpenAI or Cohere with zero changes
From f75e65cae58cc93023d6d69cb2237e160f92b39d Mon Sep 17 00:00:00 2001 From: Reynier Ortiz Vega Date: Wed, 29 Apr 2026 18:57:04 -0400 Subject: [PATCH 19/23] Title slide: surface 'manage' alongside write and search MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit The manage phase (flag, update, consolidate, crystallize) is the most differentiated part of the design — the research explicitly calls it the most neglected dimension. It deserves equal billing from the very first slide. Co-Authored-By: Claude Sonnet 4.6 --- demo/recruiter/slides.html | 9 ++++++--- 1 file changed, 6 insertions(+), 3 deletions(-) diff --git a/demo/recruiter/slides.html b/demo/recruiter/slides.html index 7010c20ef9..10f4e6e928 100644 --- a/demo/recruiter/slides.html +++ b/demo/recruiter/slides.html @@ -151,9 +151,12 @@

ToolHive Memory

Agentic Shared Memory for Teams

-

- A persistent, queryable memory layer that any Claude Code session
- can read and write — through a standard MCP interface. +

+ A persistent memory layer that any Claude Code session can + write, + search, and + manage — + through a standard MCP interface.

MCP From f4a92421983b00b563e83d9882529489d232d63f Mon Sep 17 00:00:00 2001 From: Reynier Ortiz Vega Date: Thu, 30 Apr 2026 11:15:47 -0400 Subject: [PATCH 20/23] Add hierarchical memory roadmap slide MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Shows current tag-based workaround vs the planned namespace isolation approach, with a three-tier diagram (global → team → project). Explains that the proxy stamps the namespace from OIDC context so agents never set it themselves — one schema migration, no API surface change. Co-Authored-By: Claude Sonnet 4.6 --- demo/recruiter/slides.html | 110 ++++++++++++++++++++++++++++++++++++- 1 file changed, 109 insertions(+), 1 deletion(-) diff --git a/demo/recruiter/slides.html b/demo/recruiter/slides.html index 10f4e6e928..6ac343e0b0 100644 --- a/demo/recruiter/slides.html +++ b/demo/recruiter/slides.html @@ -322,7 +322,11 @@

Architecture

Architecture

-

A shared MCP server with fully pluggable storage, vector, and embedder backends.

+

+ Memory is a system workload inside ToolHive — + auto-provisioned, singleton per scope, excluded from thv stop --all. + Fully pluggable storage, vector, and embedder backends. +

@@ -406,6 +410,110 @@

Architecture

also: OpenAI · Cohere · Google Vertex AI teams with no local GPU use OpenAI or Cohere with zero changes + + +
+
+
💻 Local (thv CLI)
+
+ thv memory init
+ Personal memory, local container.
+ SQLite + sqlite-vec defaults.
+ State in ~/.local/state/toolhive/ +
+
+
+
👥 Team (thv serve)
+
+ Shared instance, all agents connect
+ through the ToolHive API proxy.
+ Auth via existing OIDC middleware.
+ Postgres + Qdrant recommended. +
+
+
+
☸️ Kubernetes (thv-operator)
+
+ MCPMemoryServer CRD.
+ Operator reconciles → Deployment
+ + Service + PVC automatically.
+ Registered in MCPRegistry. +
+
+
+
+ + +
+

Hierarchical Memory roadmap

+

+ Today memory is a flat namespace. The path to layered, scope-aware memory is well defined. +

+ +
+ +
+

TODAY — tags as a workaround

+
+ Tag memories with a project label:
+ tags: ["project:payments"]

+ Filter in search:
+ memory_search("auth", tags=["project:payments"])

+ ⚠ Convention only — no enforcement.
+ An unfiltered search still returns everything.
+
+
+ + +
+

ROADMAP — namespace isolation

+
+ Add Namespace to every entry.
+ Proxy stamps it from OIDC token or project context — agents never set it.

+ Search walks up the hierarchy:
+ projectteamglobal

+ One schema migration. No API surface change. +
+
+
+ + + + + + + + + + + + 🌍 global + company policies · salary bands · shared skills + + + + + + + + + 👥 team: platform-eng + infra patterns · on-call runbooks + + + 👥 team: recruiting + pipeline · comp bands · interview SOP + + + 👥 team: security + threat models · CVE notes + + + + + project: thv-memory + project: operator +
From 74136adbaa82c6f657048e30d662dad8d36b82f1 Mon Sep 17 00:00:00 2001 From: Reynier Ortiz Vega Date: Thu, 30 Apr 2026 13:07:42 -0400 Subject: [PATCH 21/23] Add five design tensions slide from arXiv 2603.07670 MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Placed between the research sources slide and the comparison table so the tensions motivate the design choices that follow. Each row shows the tension name, the competing forces, and where ToolHive Memory lands — Utility/Efficiency, Faithfulness/Adaptivity, Adaptivity/Stability, Efficiency, and Governance. Co-Authored-By: Claude Sonnet 4.6 --- demo/recruiter/slides.html | 91 ++++++++++++++++++++++++++++++++++++++ 1 file changed, 91 insertions(+) diff --git a/demo/recruiter/slides.html b/demo/recruiter/slides.html index 6ac343e0b0..17ea6e27ec 100644 --- a/demo/recruiter/slides.html +++ b/demo/recruiter/slides.html @@ -251,6 +251,97 @@

What the Research Tells Us

+ +
+

Five Design Tensions

+

+ Every memory system is pulled along five axes that tug in opposite directions. + The right balance shifts with the application — a medical triage agent operates under a very different + faithfulness–efficiency frontier than a recipe recommender. + (arXiv 2603.07670) +

+ + +
+ + +
+
+
⚡ Utility
+
vs Efficiency
+
+
+
Maximising utility tempts you to store everything — bloating storage and retrieval cost. Aggressive compression silently discards the one rare fact that matters three weeks later.
+
+
+
Store semantically compressed memories, not raw transcripts. Trust scores surface high-value entries first so retrieval cost stays bounded.
+
+
+ + +
+
+
🎯 Faithfulness
+
vs Adaptivity
+
+
+
Stale or hallucinated recall can be worse than no recall at all. But locking down memory prevents it from reflecting a world that changes.
+
+
+
Conflict detection on write. Staleness scoring updated every 24h. Human-authored entries always outrank agent entries. Correction history preserved.
+
+
+ + +
+
+
🔄 Adaptivity
+
vs Stability
+
+
+
Memory that updates freely drifts — an agent can overwrite good knowledge with a bad observation. Full retrains are expensive and disrupt continuity.
+
+
+
Incremental writes via memory_remember. Updates create a revision history — nothing is ever silently overwritten. Flag + review before trust score recovers.
+
+
+ + +
+
+
📊 Efficiency
+
latency · tokens · storage
+
+
+
Every retrieved memory costs tokens in the context window. Large retrieval sets slow inference and dilute relevance. Embedding calls add latency on every write.
+
+
+
Embed once on write, never on read. Single-pass vector search with configurable top_k. TTL-based expiry keeps the store bounded. Score-weighted ranking cuts noise.
+
+
+ + +
+
+
🏛️ Governance
+
privacy · deletion · policy
+
+
+
Memory systems accumulate sensitive data. Without explicit deletion and access controls, memory becomes a liability — agents can recall things they shouldn't.
+
+
+
Explicit memory_forget. Agents can only delete their own entries; humans can delete any. TTL for automatic expiry. Read-only Resources protected by ErrReadOnly.
+
+
+ +
+ +
+
Tension
+
Our position
+
+
+

Our Approach vs. the Literature

From db4baa1ded55690c78d1cad4bd1f8381b7948fb9 Mon Sep 17 00:00:00 2001 From: Reynier Ortiz Vega Date: Thu, 30 Apr 2026 16:02:20 -0400 Subject: [PATCH 22/23] Rename title slide subtitle to emphasize cross-session persistence Co-Authored-By: Claude Sonnet 4.6 --- demo/recruiter/slides.html | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/demo/recruiter/slides.html b/demo/recruiter/slides.html index 17ea6e27ec..ada5b9a45b 100644 --- a/demo/recruiter/slides.html +++ b/demo/recruiter/slides.html @@ -150,7 +150,7 @@

ToolHive Memory

-

Agentic Shared Memory for Teams

+

Persistent Memory Across Agent Sessions

A persistent memory layer that any Claude Code session can write, From 9bb592fd927bfcc8bed3f1bf1e7557f6ccbd63aa Mon Sep 17 00:00:00 2001 From: Reynier Ortiz Vega Date: Thu, 30 Apr 2026 16:03:05 -0400 Subject: [PATCH 23/23] Generalize agent references from Claude Code to any MCP agent Co-Authored-By: Claude Sonnet 4.6 --- demo/recruiter/slides.html | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/demo/recruiter/slides.html b/demo/recruiter/slides.html index ada5b9a45b..0170bfb5f6 100644 --- a/demo/recruiter/slides.html +++ b/demo/recruiter/slides.html @@ -152,7 +152,7 @@

ToolHive Memory

Persistent Memory Across Agent Sessions

- A persistent memory layer that any Claude Code session can + A persistent memory layer that any MCP-compatible agent can write, search, and manage — @@ -1052,7 +1052,7 @@

What We Just Saw

- Any Claude Code session. One MCP config file. Shared memory across the whole team. + Any MCP-compatible agent. One config file. Shared memory across every session.