-
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathmigrations.sql
More file actions
229 lines (188 loc) · 8.58 KB
/
migrations.sql
File metadata and controls
229 lines (188 loc) · 8.58 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
-- Info Naut Database Schema
-- This file documents the database schema for reference
-- Actual migrations run automatically via Alembic on application startup
-- ============================================================
-- USERS TABLE (Auth system - currently unused in guest mode)
-- ============================================================
-- Account records for the auth system. Column order is unchanged so that
-- positional INSERTs and SELECT * keep returning the same shape.
CREATE TABLE IF NOT EXISTS users (
    id              INTEGER      PRIMARY KEY AUTOINCREMENT,
    email           VARCHAR(255) NOT NULL,
    username        VARCHAR(255) NOT NULL,
    hashed_password VARCHAR(255) NOT NULL,
    is_active       BOOLEAN      DEFAULT 1,                  -- nullable; an omitted value becomes 1
    created_at      TIMESTAMP    DEFAULT CURRENT_TIMESTAMP,
    updated_at      TIMESTAMP    DEFAULT CURRENT_TIMESTAMP,  -- set on INSERT only; no trigger in this file refreshes it
    UNIQUE (email),
    UNIQUE (username)
);

-- NOTE(review): SQLite already backs every UNIQUE constraint with an automatic
-- index, so these two look redundant. They are kept because their names may be
-- referenced outside this file.
CREATE INDEX IF NOT EXISTS idx_users_email
    ON users (email);
CREATE INDEX IF NOT EXISTS idx_users_username
    ON users (username);
-- ============================================================
-- API KEYS TABLE
-- ============================================================
-- One row per API key; each key belongs to a user through user_id.
CREATE TABLE IF NOT EXISTS api_keys (
    id           INTEGER      PRIMARY KEY AUTOINCREMENT,
    key_hash     VARCHAR(512) NOT NULL,                   -- NOTE(review): neither UNIQUE nor indexed; confirm how keys are looked up
    name         VARCHAR(255) NOT NULL,
    user_id      INTEGER      NOT NULL,
    is_active    BOOLEAN      DEFAULT 1,
    created_at   TIMESTAMP    DEFAULT CURRENT_TIMESTAMP,
    expires_at   TIMESTAMP,                               -- nullable, no default
    last_used_at TIMESTAMP,                               -- nullable, no default
    -- Deleting a user deletes that user's keys (only while foreign_keys is ON).
    FOREIGN KEY (user_id)
        REFERENCES users (id)
        ON DELETE CASCADE
);

CREATE INDEX IF NOT EXISTS idx_api_keys_user
    ON api_keys (user_id);
CREATE INDEX IF NOT EXISTS idx_api_keys_active
    ON api_keys (is_active);
-- ============================================================
-- KNOWLEDGE BASES TABLE
-- ============================================================
-- Named collections that documents are attached to; each is owned by one user.
CREATE TABLE IF NOT EXISTS knowledge_bases (
    id          INTEGER      PRIMARY KEY AUTOINCREMENT,
    name        VARCHAR(255) NOT NULL,
    description TEXT,                                     -- optional free text
    user_id     INTEGER      NOT NULL,
    created_at  TIMESTAMP    DEFAULT CURRENT_TIMESTAMP,
    updated_at  TIMESTAMP    DEFAULT CURRENT_TIMESTAMP,   -- set on INSERT only; no trigger in this file refreshes it
    -- Deleting a user deletes that user's knowledge bases (only while foreign_keys is ON).
    FOREIGN KEY (user_id)
        REFERENCES users (id)
        ON DELETE CASCADE
);

CREATE INDEX IF NOT EXISTS idx_kb_user
    ON knowledge_bases (user_id);
CREATE INDEX IF NOT EXISTS idx_kb_created
    ON knowledge_bases (created_at);
-- ============================================================
-- DOCUMENTS TABLE
-- ============================================================
-- Files stored in a knowledge base, together with their processing state.
CREATE TABLE IF NOT EXISTS documents (
    id                      INTEGER      PRIMARY KEY AUTOINCREMENT,
    filename                VARCHAR(255) NOT NULL,
    file_path               VARCHAR(512) NOT NULL,
    file_size               INTEGER,
    mime_type               VARCHAR(128),
    knowledge_base_id       INTEGER      NOT NULL,
    status                  VARCHAR(50)  DEFAULT 'pending',          -- pending | processing | completed | failed (no CHECK enforces this list)
    processing_started_at   TIMESTAMP,
    processing_completed_at TIMESTAMP,
    error_message           TEXT,
    chunk_count             INTEGER      DEFAULT 0,
    created_at              TIMESTAMP    DEFAULT CURRENT_TIMESTAMP,
    updated_at              TIMESTAMP    DEFAULT CURRENT_TIMESTAMP,
    -- Deleting a knowledge base deletes its documents (only while foreign_keys is ON).
    FOREIGN KEY (knowledge_base_id)
        REFERENCES knowledge_bases (id)
        ON DELETE CASCADE
);

CREATE INDEX IF NOT EXISTS idx_documents_kb
    ON documents (knowledge_base_id);
CREATE INDEX IF NOT EXISTS idx_documents_status
    ON documents (status);
CREATE INDEX IF NOT EXISTS idx_documents_created
    ON documents (created_at);
-- ============================================================
-- DOCUMENT UPLOADS TABLE (Processing Queue)
-- ============================================================
-- Processing queue: one row per upload, keyed by a caller-supplied string id.
CREATE TABLE IF NOT EXISTS document_uploads (
    -- NOT NULL is explicit because SQLite accepts NULL in a non-INTEGER
    -- PRIMARY KEY of an ordinary rowid table.
    id                VARCHAR(255) NOT NULL PRIMARY KEY,
    filename          VARCHAR(255) NOT NULL,
    knowledge_base_id INTEGER      NOT NULL,
    status            VARCHAR(50)  DEFAULT 'pending',
    document_id       INTEGER,                                -- nullable; reset to NULL when the linked document is deleted
    created_at        TIMESTAMP    DEFAULT CURRENT_TIMESTAMP,
    updated_at        TIMESTAMP    DEFAULT CURRENT_TIMESTAMP,
    -- Deleting a knowledge base deletes its queued uploads (only while foreign_keys is ON).
    FOREIGN KEY (knowledge_base_id)
        REFERENCES knowledge_bases (id)
        ON DELETE CASCADE,
    -- Deleting a document keeps the upload row but clears its link.
    FOREIGN KEY (document_id)
        REFERENCES documents (id)
        ON DELETE SET NULL
);

CREATE INDEX IF NOT EXISTS idx_uploads_kb
    ON document_uploads (knowledge_base_id);
CREATE INDEX IF NOT EXISTS idx_uploads_status
    ON document_uploads (status);
-- Index the second foreign-key column as well: without it, every delete from
-- documents has to scan this whole table to apply ON DELETE SET NULL.
CREATE INDEX IF NOT EXISTS idx_uploads_document
    ON document_uploads (document_id);
-- ============================================================
-- CHUNKS TABLE (Document Chunks for RAG)
-- ============================================================
-- Text slices of a document used for retrieval; each row records where in the
-- source the slice came from (line and character offsets).
CREATE TABLE IF NOT EXISTS chunks (
    id             INTEGER      PRIMARY KEY AUTOINCREMENT,
    document_id    INTEGER      NOT NULL,
    doc_id         VARCHAR(255) NOT NULL,                    -- document identifier (not unique per row)
    chunk_id       VARCHAR(255) NOT NULL,                    -- chunk identifier; unique, see constraint below
    content        TEXT         NOT NULL,
    line_start     INTEGER      NOT NULL,
    line_end       INTEGER      NOT NULL,
    char_start     INTEGER      NOT NULL,
    char_end       INTEGER      NOT NULL,
    chunk_metadata TEXT,                                     -- JSON metadata
    embedding_id   VARCHAR(255),                             -- reference into the vector store
    created_at     TIMESTAMP    DEFAULT CURRENT_TIMESTAMP,
    UNIQUE (chunk_id),
    -- Deleting a document deletes its chunks (only while foreign_keys is ON).
    FOREIGN KEY (document_id)
        REFERENCES documents (id)
        ON DELETE CASCADE
);

CREATE INDEX IF NOT EXISTS idx_chunks_document
    ON chunks (document_id);
CREATE INDEX IF NOT EXISTS idx_chunks_doc_id
    ON chunks (doc_id);
-- NOTE(review): the UNIQUE constraint on chunk_id already provides an automatic
-- index, so this one looks redundant. It is kept because its name may be
-- referenced outside this file.
CREATE INDEX IF NOT EXISTS idx_chunks_chunk_id
    ON chunks (chunk_id);
-- ============================================================
-- CHATS TABLE
-- ============================================================
-- Conversation headers; the messages themselves live in the messages table.
CREATE TABLE IF NOT EXISTS chats (
    id         INTEGER      PRIMARY KEY AUTOINCREMENT,
    title      VARCHAR(255),                              -- optional
    user_id    INTEGER      NOT NULL,
    created_at TIMESTAMP    DEFAULT CURRENT_TIMESTAMP,
    updated_at TIMESTAMP    DEFAULT CURRENT_TIMESTAMP,    -- set on INSERT only; no trigger in this file refreshes it
    -- Deleting a user deletes that user's chats (only while foreign_keys is ON).
    FOREIGN KEY (user_id)
        REFERENCES users (id)
        ON DELETE CASCADE
);

CREATE INDEX IF NOT EXISTS idx_chats_user
    ON chats (user_id);
CREATE INDEX IF NOT EXISTS idx_chats_created
    ON chats (created_at);
-- ============================================================
-- CHAT_KNOWLEDGE_BASES TABLE (Many-to-Many)
-- ============================================================
-- Many-to-many link between chats and knowledge bases. The composite primary
-- key allows each (chat_id, knowledge_base_id) pair at most once.
CREATE TABLE IF NOT EXISTS chat_knowledge_bases (
    chat_id           INTEGER NOT NULL,
    knowledge_base_id INTEGER NOT NULL,
    PRIMARY KEY (chat_id, knowledge_base_id),
    -- A link row is deleted when either side is deleted (only while foreign_keys is ON).
    FOREIGN KEY (chat_id)
        REFERENCES chats (id)
        ON DELETE CASCADE,
    FOREIGN KEY (knowledge_base_id)
        REFERENCES knowledge_bases (id)
        ON DELETE CASCADE
);

-- NOTE(review): the primary-key index already leads with chat_id, so this
-- index looks redundant. It is kept because its name may be referenced
-- outside this file.
CREATE INDEX IF NOT EXISTS idx_chat_kb_chat
    ON chat_knowledge_bases (chat_id);
-- Serves lookups that start from the knowledge-base side.
CREATE INDEX IF NOT EXISTS idx_chat_kb_kb
    ON chat_knowledge_bases (knowledge_base_id);
-- ============================================================
-- MESSAGES TABLE
-- ============================================================
-- Individual turns of a chat.
CREATE TABLE IF NOT EXISTS messages (
    id         INTEGER     PRIMARY KEY AUTOINCREMENT,
    content    TEXT        NOT NULL,
    role       VARCHAR(50) NOT NULL,                     -- user | assistant | system (no CHECK enforces this list)
    chat_id    INTEGER     NOT NULL,
    metadata   TEXT,                                     -- JSON metadata (citations, grounding score, etc.)
    created_at TIMESTAMP   DEFAULT CURRENT_TIMESTAMP,
    -- Deleting a chat deletes its messages (only while foreign_keys is ON).
    FOREIGN KEY (chat_id)
        REFERENCES chats (id)
        ON DELETE CASCADE
);

CREATE INDEX IF NOT EXISTS idx_messages_chat
    ON messages (chat_id);
CREATE INDEX IF NOT EXISTS idx_messages_created
    ON messages (created_at);
-- ============================================================
-- VECTOR STORE METADATA (Optional - for SQLite vector index)
-- ============================================================
-- Note: If using FAISS/HNSWlib with SQLite, vectors are stored
-- in separate binary files, referenced by embedding_id in chunks table
-- ============================================================
-- EXAMPLE QUERIES
-- ============================================================
-- Get all knowledge bases for a user
-- SELECT * FROM knowledge_bases WHERE user_id = ?;
-- Get all documents in a knowledge base with processing status
-- SELECT * FROM documents WHERE knowledge_base_id = ? ORDER BY created_at DESC;
-- Get chunks for a document with citation metadata
-- SELECT doc_id, chunk_id, content, line_start, line_end
-- FROM chunks WHERE document_id = ? ORDER BY chunk_id;
-- Get chat history with messages
-- SELECT m.* FROM messages m
-- JOIN chats c ON m.chat_id = c.id
-- WHERE c.id = ? ORDER BY m.created_at;
-- ============================================================
-- MIGRATION NOTES
-- ============================================================
-- This schema is automatically applied via Alembic migrations
-- located in backend/alembic/versions/
--
-- To apply migrations manually (not recommended):
-- cd backend
-- alembic upgrade head
--
-- To create a new migration:
-- alembic revision --autogenerate -m "description"
--
-- Database auto-initializes on first application startup
-- No manual SQL execution required
-- ============================================================
-- SQLITE OPTIMIZATIONS
-- ============================================================
-- Switch the journal to write-ahead logging for better read/write concurrency.
PRAGMA journal_mode = WAL;

-- Page-cache budget. A negative value is a size in KiB rather than a page
-- count, so this asks for 64000 KiB (roughly 64 MB).
PRAGMA cache_size = -64000;

-- Turn on foreign-key enforcement; the ON DELETE CASCADE / SET NULL actions
-- declared in this schema do nothing without it.
-- NOTE(review): cache_size and foreign_keys apply to the current connection
-- only; confirm the application also sets them on its own connections.
PRAGMA foreign_keys = ON;