-- File: schema.sql
-- Knowledge Base PostgreSQL Schema
-- Requires: pgvector extension
-- Enable the pgvector extension (installed under the extension name "vector").
-- The VECTOR column type and the ivfflat index method used later in this file
-- are provided by it, so this statement has to run before those objects are
-- created. IF NOT EXISTS turns it into a no-op when the extension is already
-- installed in the current database.
CREATE EXTENSION IF NOT EXISTS vector;
-- Main documents table: one row per source document.
--
--   id           surrogate primary key, assigned automatically (BIGSERIAL)
--   source_path  required and UNIQUE, so a given path maps to at most one row
--   title        required
--   content      required document text
--   category     optional label, limited to 100 characters
--   metadata     optional JSONB payload; defaults to an empty object
--   created_at   defaults to the insert time
--   updated_at   defaults to the insert time; the DEFAULT only fires on
--                INSERT and nothing in this file refreshes it on UPDATE, so
--                writers must set it explicitly when modifying a row
--
-- IF NOT EXISTS keeps the script re-runnable, matching the CREATE EXTENSION
-- statement above. Note that it skips creation entirely when the table is
-- already present; it does not reconcile an older definition.
--
-- Timestamps are TIMESTAMPTZ rather than plain TIMESTAMP: NOW() returns a
-- time-zone-aware value, and storing it in a zone-less column silently
-- truncates it to the session's local wall-clock time, which makes rows
-- written under different TimeZone settings incomparable.
CREATE TABLE IF NOT EXISTS documents (
    id          BIGSERIAL    PRIMARY KEY,
    source_path TEXT         NOT NULL UNIQUE,
    title       TEXT         NOT NULL,
    content     TEXT         NOT NULL,
    category    VARCHAR(100),
    metadata    JSONB        DEFAULT '{}'::jsonb,
    created_at  TIMESTAMPTZ  DEFAULT NOW(),
    updated_at  TIMESTAMPTZ  DEFAULT NOW()
);
-- Summaries table: generated summaries of documents, each optionally carrying
-- a vector embedding.
--
--   id                    surrogate primary key, assigned automatically
--   document_id           required reference to documents(id); ON DELETE
--                         CASCADE removes a document's summaries together
--                         with the document. No uniqueness is enforced, so a
--                         document may have any number of summaries.
--   content               required summary text
--   tokens                optional integer (presumably the token count of
--                         `content` -- confirm against the writer)
--   embedding             optional pgvector value with exactly 1536
--                         dimensions; NULL is allowed
--   model_name            required (presumably the model that produced the
--                         summary and/or embedding -- confirm against the
--                         writer)
--   generation_timestamp  defaults to the insert time
--
-- IF NOT EXISTS keeps the script re-runnable, matching the CREATE EXTENSION
-- statement earlier in the file; it does not reconcile an older definition
-- of an already-existing table.
--
-- generation_timestamp is TIMESTAMPTZ rather than plain TIMESTAMP so the
-- value produced by NOW() keeps its time-zone information instead of being
-- reduced to the session's local wall-clock time.
CREATE TABLE IF NOT EXISTS summaries (
    id                   BIGSERIAL    PRIMARY KEY,
    document_id          BIGINT       NOT NULL REFERENCES documents(id) ON DELETE CASCADE,
    content              TEXT         NOT NULL,
    tokens               INT,
    embedding            VECTOR(1536),
    model_name           TEXT         NOT NULL,
    generation_timestamp TIMESTAMPTZ  DEFAULT NOW()
);
-- Indexes
-- Every statement uses IF NOT EXISTS so the script can be re-run without
-- failing on already-created indexes.

-- documents: equality filter on category, range/sort on updated_at, and
-- JSONB containment / key-existence lookups on metadata (default GIN opclass).
CREATE INDEX IF NOT EXISTS idx_documents_category ON documents (category);
CREATE INDEX IF NOT EXISTS idx_documents_updated  ON documents (updated_at);
CREATE INDEX IF NOT EXISTS idx_documents_metadata ON documents USING gin (metadata);

-- summaries: PostgreSQL does not index the referencing side of a foreign key
-- automatically. Without this index, every DELETE on documents (which
-- cascades into summaries) and every join on document_id scans the whole
-- summaries table.
CREATE INDEX IF NOT EXISTS summaries_document_id_idx ON summaries (document_id);

-- Full-text search over summary text. This is an expression index: a query
-- can only use it when it spells the expression the same way, i.e.
-- to_tsvector('english', content) with the explicit 'english' configuration.
CREATE INDEX IF NOT EXISTS summaries_content_gin
    ON summaries USING gin (to_tsvector('english', content));

-- Approximate nearest-neighbour search on embeddings. vector_l2_ops serves
-- Euclidean (L2) distance ordering, i.e. the `<->` operator; cosine or
-- inner-product queries will not use this index.
-- NOTE(review): ivfflat derives its `lists` cluster centres from the rows
-- present at build time. Built on an empty table (as happens when this file
-- bootstraps a fresh database) recall will be poor until the index is
-- rebuilt (REINDEX) after data has been loaded; lists = 100 should also be
-- revisited against the real row count.
CREATE INDEX IF NOT EXISTS summaries_embedding_idx
    ON summaries USING ivfflat (embedding vector_l2_ops) WITH (lists = 100);