fix(ai-chat): OpenAI Chat Completions for multi-turn + provider settings, stream UX & errors" -m "Live-stand fixes (OpenRouter / OpenAI-compatible):

- openai provider: use .chat() (Chat Completions) instead of the default callable (Responses API), which gateways reject on multi-turn -> 400. - updateAiProviderSettings: assemble settings.ai.provider via jsonb_build_object with ::text-cast bound params + jsonb_typeof self-heal (postgres.js was double-encoding it into an array; the ::text cast avoids 'could not determine data type of parameter'). - chat agent: drop the hard maxOutputTokens cap (truncated complex tool calls); keep a tiny cap only on the test-connection ping. - testConnection + chat stream: surface the real provider error (statusCode+message) to logs and the UI instead of generic masks; never log the API key. - chat UI: typing indicator, incremental streaming render, tool 'running' status, Stop. Also bundled (prior uncommitted ai-chat work): - history 'AI agent' provenance badge; vector RAG (pgvector image + page_embeddings + AI_QUEUE indexer + space-scoped semanticSearch); external MCP servers backend (@ai-sdk/mcp client, SSRF IP-pinning, encrypted headers, admin CRUD/Test); yjs duplicate-instance fix via pnpm patch (single CJS instance server-side).
2026-06-17 04:28:29 +03:00
parent 44b340dc1a
commit a4b7919753
44 changed files with 2633 additions and 122 deletions
--- a/apps/server/src/database/migrations/20260617T120000-page-embeddings.ts
+++ b/apps/server/src/database/migrations/20260617T120000-page-embeddings.ts
@@ -0,0 +1,107 @@
+import { type Kysely, sql } from 'kysely';
+
+/**
+ * Vector-RAG storage for the AI agent (§5.5 / §6.7 stage D / §14[M6,M7]).
+ *
+ * Creates the pgvector `vector` extension and the `page_embeddings` table that
+ * backs semantic search. Columns mirror the hand-written `PageEmbeddings`
+ * Kysely type (apps/server/src/database/types/embeddings.types.ts) one-to-one.
+ *
+ * The indexer + `semanticSearch` tool are a later unit; this migration only
+ * provisions the extension, the table and its indexes.
+ *
+ * The `embedding` column is `vector(EMBEDDING_DIMENSIONS)`. The dimension is
+ * FIXED at table-creation time and must match the embedding model in use.
+ * 1536 is the default for OpenAI `text-embedding-3-small` / `-ada-002`.
+ * Switching to a model with a DIFFERENT dimension (e.g. Gemini
+ * `text-embedding-004` = 768, Ollama `nomic-embed-text` = 768) requires
+ * re-creating the column and rebuilding the HNSW index. The actual model and
+ * its dimension are recorded PER ROW in `model_name` / `model_dimensions` so a
+ * future migration can detect and re-index mismatched rows.
+ */
+const EMBEDDING_DIMENSIONS = 1536;
+
+export async function up(db: Kysely<any>): Promise<void> {
+  // pgvector extension (provided by the pgvector/pgvector:pg18 image).
+  await sql`CREATE EXTENSION IF NOT EXISTS vector`.execute(db);
+
+  await db.schema
+    .createTable('page_embeddings')
+    .ifNotExists()
+    .addColumn('id', 'uuid', (col) =>
+      col.primaryKey().defaultTo(sql`gen_uuid_v7()`),
+    )
+    .addColumn('workspace_id', 'uuid', (col) =>
+      col.notNull().references('workspaces.id').onDelete('cascade'),
+    )
+    .addColumn('page_id', 'uuid', (col) =>
+      col.notNull().references('pages.id').onDelete('cascade'),
+    )
+    .addColumn('space_id', 'uuid', (col) =>
+      col.notNull().references('spaces.id').onDelete('cascade'),
+    )
+    // Embeddings may cover an attachment instead of page body; nullable, and the
+    // attachment row going away should drop its embeddings.
+    .addColumn('attachment_id', 'uuid', (col) =>
+      col.references('attachments.id').onDelete('cascade'),
+    )
+    // One row per chunk of a page; chunk_index orders them within the page.
+    .addColumn('chunk_index', 'integer', (col) => col.notNull().defaultTo(0))
+    .addColumn('chunk_start', 'integer', (col) => col.notNull().defaultTo(0))
+    .addColumn('chunk_length', 'integer', (col) => col.notNull().defaultTo(0))
+    // The chunk text that produced the embedding (always set by the indexer).
+    .addColumn('content', 'text', (col) => col.notNull())
+    // Provenance of the vector: model id + its output dimension (see header).
+    .addColumn('model_name', 'varchar', (col) => col.notNull())
+    .addColumn('model_dimensions', 'integer', (col) => col.notNull())
+    // Fixed-dimension vector column. Raw type since pgvector's `vector(N)` is not
+    // a native Kysely column type.
+    .addColumn(
+      'embedding',
+      sql`vector(${sql.raw(String(EMBEDDING_DIMENSIONS))})`,
+    )
+    .addColumn('metadata', 'jsonb', (col) =>
+      col.notNull().defaultTo(sql`'{}'::jsonb`),
+    )
+    .addColumn('created_at', 'timestamptz', (col) =>
+      col.notNull().defaultTo(sql`now()`),
+    )
+    .addColumn('updated_at', 'timestamptz', (col) =>
+      col.notNull().defaultTo(sql`now()`),
+    )
+    .addColumn('deleted_at', 'timestamptz', (col) => col)
+    // One stored vector per (page, chunk).
+    .addUniqueConstraint('uq_page_embeddings_page_chunk', [
+      'page_id',
+      'chunk_index',
+    ])
+    .execute();
+
+  // ANN index for cosine-similarity search over the embedding vectors (HNSW).
+  await sql`
+    CREATE INDEX IF NOT EXISTS idx_page_embeddings_embedding_hnsw
+      ON page_embeddings
+      USING hnsw (embedding vector_cosine_ops)
+  `.execute(db);
+
+  // Btree indexes for scoped lookups/deletes (re-index a page, purge a workspace).
+  await db.schema
+    .createIndex('idx_page_embeddings_page_id')
+    .ifNotExists()
+    .on('page_embeddings')
+    .column('page_id')
+    .execute();
+
+  await db.schema
+    .createIndex('idx_page_embeddings_workspace_id')
+    .ifNotExists()
+    .on('page_embeddings')
+    .column('workspace_id')
+    .execute();
+}
+
+export async function down(db: Kysely<any>): Promise<void> {
+  // Drop the table only; leave the `vector` extension in place (it may be used
+  // by other objects and dropping it is destructive).
+  await db.schema.dropTable('page_embeddings').ifExists().execute();
+}
--- a/apps/server/src/database/migrations/20260617T130000-ai-mcp-servers.ts
+++ b/apps/server/src/database/migrations/20260617T130000-ai-mcp-servers.ts
@@ -0,0 +1,44 @@
+import { type Kysely, sql } from 'kysely';
+
+export async function up(db: Kysely<any>): Promise<void> {
+  await db.schema
+    .createTable('ai_mcp_servers')
+    .ifNotExists()
+    .addColumn('id', 'uuid', (col) =>
+      col.primaryKey().defaultTo(sql`gen_uuid_v7()`),
+    )
+    .addColumn('workspace_id', 'uuid', (col) =>
+      col.references('workspaces.id').onDelete('cascade').notNull(),
+    )
+    // display name, e.g. 'Tavily'.
+    .addColumn('name', 'varchar', (col) => col.notNull())
+    // 'http' | 'sse' — the @ai-sdk/mcp transport type.
+    .addColumn('transport', 'varchar', (col) => col.notNull())
+    // remote MCP endpoint URL.
+    .addColumn('url', 'text', (col) => col.notNull())
+    // SECURITY (§8.10): AES-256-GCM blob of the JSON auth headers. Write-only;
+    // NEVER added to workspace baseFields and NEVER returned by any endpoint.
+    .addColumn('headers_enc', 'text', (col) => col)
+    // optional: restrict which remote tool names to expose to the agent.
+    .addColumn('tool_allowlist', 'jsonb', (col) => col)
+    .addColumn('enabled', 'boolean', (col) => col.notNull().defaultTo(true))
+    .addColumn('created_at', 'timestamptz', (col) =>
+      col.notNull().defaultTo(sql`now()`),
+    )
+    .addColumn('updated_at', 'timestamptz', (col) =>
+      col.notNull().defaultTo(sql`now()`),
+    )
+    .execute();
+
+  // Scoped lookups (listByWorkspace / listEnabled) hit workspace_id first.
+  await db.schema
+    .createIndex('ai_mcp_servers_workspace_id_idx')
+    .ifNotExists()
+    .on('ai_mcp_servers')
+    .column('workspace_id')
+    .execute();
+}
+
+export async function down(db: Kysely<any>): Promise<void> {
+  await db.schema.dropTable('ai_mcp_servers').execute();
+}