fix(ai-chat): OpenAI Chat Completions for multi-turn + provider settings, stream UX & errors" -m "Live-stand fixes (OpenRouter / OpenAI-compatible):

- openai provider: use .chat() (Chat Completions) instead of the default callable
  (Responses API), which gateways reject on multi-turn -> 400.
- updateAiProviderSettings: assemble settings.ai.provider via jsonb_build_object
  with ::text-cast bound params + jsonb_typeof self-heal (postgres.js was
  double-encoding it into an array; the ::text cast avoids 'could not determine
  data type of parameter').
- chat agent: drop the hard maxOutputTokens cap (truncated complex tool calls);
  keep a tiny cap only on the test-connection ping.
- testConnection + chat stream: surface the real provider error (statusCode+message)
  to logs and the UI instead of generic masks; never log the API key.
- chat UI: typing indicator, incremental streaming render, tool 'running' status, Stop.

Also bundled (prior uncommitted ai-chat work):
- history 'AI agent' provenance badge; vector RAG (pgvector image + page_embeddings
  + AI_QUEUE indexer + space-scoped semanticSearch); external MCP servers backend
  (@ai-sdk/mcp client, SSRF IP-pinning, encrypted headers, admin CRUD/Test);
  yjs duplicate-instance fix via pnpm patch (single CJS instance server-side).
This commit is contained in:
vvzvlad
2026-06-17 04:28:29 +03:00
parent 44b340dc1a
commit a4b7919753
44 changed files with 2633 additions and 122 deletions

View File

@@ -0,0 +1,107 @@
import { type Kysely, sql } from 'kysely';
/**
* Vector-RAG storage for the AI agent (§5.5 / §6.7 stage D / §14[M6,M7]).
*
* Creates the pgvector `vector` extension and the `page_embeddings` table that
* backs semantic search. Columns mirror the hand-written `PageEmbeddings`
* Kysely type (apps/server/src/database/types/embeddings.types.ts) one-to-one.
*
* The indexer + `semanticSearch` tool are a later unit; this migration only
* provisions the extension, the table and its indexes.
*
* The `embedding` column is `vector(EMBEDDING_DIMENSIONS)`. The dimension is
* FIXED at table-creation time and must match the embedding model in use.
* 1536 is the default for OpenAI `text-embedding-3-small` / `-ada-002`.
* Switching to a model with a DIFFERENT dimension (e.g. Gemini
* `text-embedding-004` = 768, Ollama `nomic-embed-text` = 768) requires
* re-creating the column and rebuilding the HNSW index. The actual model and
* its dimension are recorded PER ROW in `model_name` / `model_dimensions` so a
* future migration can detect and re-index mismatched rows.
*/
const EMBEDDING_DIMENSIONS = 1536;
export async function up(db: Kysely<any>): Promise<void> {
// pgvector extension (provided by the pgvector/pgvector:pg18 image).
await sql`CREATE EXTENSION IF NOT EXISTS vector`.execute(db);
await db.schema
.createTable('page_embeddings')
.ifNotExists()
.addColumn('id', 'uuid', (col) =>
col.primaryKey().defaultTo(sql`gen_uuid_v7()`),
)
.addColumn('workspace_id', 'uuid', (col) =>
col.notNull().references('workspaces.id').onDelete('cascade'),
)
.addColumn('page_id', 'uuid', (col) =>
col.notNull().references('pages.id').onDelete('cascade'),
)
.addColumn('space_id', 'uuid', (col) =>
col.notNull().references('spaces.id').onDelete('cascade'),
)
// Embeddings may cover an attachment instead of page body; nullable, and the
// attachment row going away should drop its embeddings.
.addColumn('attachment_id', 'uuid', (col) =>
col.references('attachments.id').onDelete('cascade'),
)
// One row per chunk of a page; chunk_index orders them within the page.
.addColumn('chunk_index', 'integer', (col) => col.notNull().defaultTo(0))
.addColumn('chunk_start', 'integer', (col) => col.notNull().defaultTo(0))
.addColumn('chunk_length', 'integer', (col) => col.notNull().defaultTo(0))
// The chunk text that produced the embedding (always set by the indexer).
.addColumn('content', 'text', (col) => col.notNull())
// Provenance of the vector: model id + its output dimension (see header).
.addColumn('model_name', 'varchar', (col) => col.notNull())
.addColumn('model_dimensions', 'integer', (col) => col.notNull())
// Fixed-dimension vector column. Raw type since pgvector's `vector(N)` is not
// a native Kysely column type.
.addColumn(
'embedding',
sql`vector(${sql.raw(String(EMBEDDING_DIMENSIONS))})`,
)
.addColumn('metadata', 'jsonb', (col) =>
col.notNull().defaultTo(sql`'{}'::jsonb`),
)
.addColumn('created_at', 'timestamptz', (col) =>
col.notNull().defaultTo(sql`now()`),
)
.addColumn('updated_at', 'timestamptz', (col) =>
col.notNull().defaultTo(sql`now()`),
)
.addColumn('deleted_at', 'timestamptz', (col) => col)
// One stored vector per (page, chunk).
.addUniqueConstraint('uq_page_embeddings_page_chunk', [
'page_id',
'chunk_index',
])
.execute();
// ANN index for cosine-similarity search over the embedding vectors (HNSW).
await sql`
CREATE INDEX IF NOT EXISTS idx_page_embeddings_embedding_hnsw
ON page_embeddings
USING hnsw (embedding vector_cosine_ops)
`.execute(db);
// Btree indexes for scoped lookups/deletes (re-index a page, purge a workspace).
await db.schema
.createIndex('idx_page_embeddings_page_id')
.ifNotExists()
.on('page_embeddings')
.column('page_id')
.execute();
await db.schema
.createIndex('idx_page_embeddings_workspace_id')
.ifNotExists()
.on('page_embeddings')
.column('workspace_id')
.execute();
}
export async function down(db: Kysely<any>): Promise<void> {
// Drop the table only; leave the `vector` extension in place (it may be used
// by other objects and dropping it is destructive).
await db.schema.dropTable('page_embeddings').ifExists().execute();
}

View File

@@ -0,0 +1,44 @@
import { type Kysely, sql } from 'kysely';
export async function up(db: Kysely<any>): Promise<void> {
await db.schema
.createTable('ai_mcp_servers')
.ifNotExists()
.addColumn('id', 'uuid', (col) =>
col.primaryKey().defaultTo(sql`gen_uuid_v7()`),
)
.addColumn('workspace_id', 'uuid', (col) =>
col.references('workspaces.id').onDelete('cascade').notNull(),
)
// display name, e.g. 'Tavily'.
.addColumn('name', 'varchar', (col) => col.notNull())
// 'http' | 'sse' — the @ai-sdk/mcp transport type.
.addColumn('transport', 'varchar', (col) => col.notNull())
// remote MCP endpoint URL.
.addColumn('url', 'text', (col) => col.notNull())
// SECURITY (§8.10): AES-256-GCM blob of the JSON auth headers. Write-only;
// NEVER added to workspace baseFields and NEVER returned by any endpoint.
.addColumn('headers_enc', 'text', (col) => col)
// optional: restrict which remote tool names to expose to the agent.
.addColumn('tool_allowlist', 'jsonb', (col) => col)
.addColumn('enabled', 'boolean', (col) => col.notNull().defaultTo(true))
.addColumn('created_at', 'timestamptz', (col) =>
col.notNull().defaultTo(sql`now()`),
)
.addColumn('updated_at', 'timestamptz', (col) =>
col.notNull().defaultTo(sql`now()`),
)
.execute();
// Scoped lookups (listByWorkspace / listEnabled) hit workspace_id first.
await db.schema
.createIndex('ai_mcp_servers_workspace_id_idx')
.ifNotExists()
.on('ai_mcp_servers')
.column('workspace_id')
.execute();
}
export async function down(db: Kysely<any>): Promise<void> {
await db.schema.dropTable('ai_mcp_servers').execute();
}