-
Notifications
You must be signed in to change notification settings - Fork 4
Expand file tree
/
Copy pathcreate-tables.sql
More file actions
164 lines (145 loc) · 5.98 KB
/
create-tables.sql
File metadata and controls
164 lines (145 loc) · 5.98 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
-- Schema bootstrap for AGI Detector.
-- The pgvector extension supplies the "vector" column type that the
-- embedding column in this script depends on; IF NOT EXISTS makes the
-- statement a no-op when the extension is already installed.
CREATE EXTENSION IF NOT EXISTS "vector";
-- "CrawlResult": one row per crawled page.
-- The primary key is a server-generated UUID stored as TEXT.
-- "timestamp" has millisecond precision and no time zone, and defaults to
-- the insert time.
CREATE TABLE IF NOT EXISTS "CrawlResult" (
    "id"        TEXT         NOT NULL DEFAULT gen_random_uuid(),
    "url"       TEXT         NOT NULL,
    "title"     TEXT         NOT NULL,
    "content"   TEXT         NOT NULL,
    "timestamp" TIMESTAMP(3) NOT NULL DEFAULT CURRENT_TIMESTAMP,
    "metadata"  JSONB        NOT NULL,

    CONSTRAINT "CrawlResult_pkey" PRIMARY KEY ("id")
);
-- "AnalysisResult": analysis output attached to a crawl row via "crawlId".
-- "score", "indicators" and "confidence" are mandatory; the model/heuristic
-- sub-scores, the JSON breakdown and the embedding may be NULL.
-- "embedding" is a 512-dimension pgvector column, so the vector extension
-- must be installed before this statement runs.
CREATE TABLE IF NOT EXISTS "AnalysisResult" (
    "id"             TEXT             NOT NULL DEFAULT gen_random_uuid(),
    "crawlId"        TEXT             NOT NULL,
    "score"          DOUBLE PRECISION NOT NULL,
    "modelScore"     DOUBLE PRECISION,
    "heuristicScore" DOUBLE PRECISION,
    "scoreBreakdown" JSONB,
    "indicators"     TEXT[]           NOT NULL,
    "confidence"     DOUBLE PRECISION NOT NULL,
    "embedding"      vector(512),
    "timestamp"      TIMESTAMP(3)     NOT NULL DEFAULT CURRENT_TIMESTAMP,

    CONSTRAINT "AnalysisResult_pkey" PRIMARY KEY ("id")
);
-- Secondary (non-unique) indexes on the crawl URL and the analysis score.
CREATE INDEX IF NOT EXISTS "CrawlResult_url_idx"
    ON "CrawlResult" ("url");
CREATE INDEX IF NOT EXISTS "AnalysisResult_score_idx"
    ON "AnalysisResult" ("score");

-- Uniqueness: at most one "AnalysisResult" row may reference a given crawl.
CREATE UNIQUE INDEX IF NOT EXISTS "AnalysisResult_crawlId_key"
    ON "AnalysisResult" ("crawlId");
-- Foreign key: "AnalysisResult"."crawlId" -> "CrawlResult"."id".
--   ON DELETE RESTRICT: a crawl row cannot be deleted while an analysis
--                       row still references it.
--   ON UPDATE CASCADE:  a change to "CrawlResult"."id" is propagated to
--                       the referencing "crawlId".
-- PostgreSQL has no ADD CONSTRAINT IF NOT EXISTS, so the constraint is
-- looked up in pg_constraint first. Without this guard a second run of the
-- script fails with "constraint ... already exists", even though every
-- other statement here is re-runnable.
DO $$
BEGIN
    IF NOT EXISTS (
        SELECT 1
        FROM pg_constraint
        WHERE conname = 'AnalysisResult_crawlId_fkey'
          AND conrelid = '"AnalysisResult"'::regclass
    ) THEN
        ALTER TABLE "AnalysisResult"
            ADD CONSTRAINT "AnalysisResult_crawlId_fkey"
            FOREIGN KEY ("crawlId") REFERENCES "CrawlResult" ("id")
            ON DELETE RESTRICT ON UPDATE CASCADE;
    END IF;
END
$$;
-- TrendAnalysis dedupe support, applied only if the table already exists.
-- "TrendAnalysis" is not created by this script, so a bare ALTER TABLE /
-- CREATE INDEX would abort the whole run with "relation does not exist" on
-- a database that lacks it. to_regclass() returns NULL for a missing
-- relation instead of raising, which lets both statements be skipped.
-- When the table is present:
--   * add the nullable "dateBucket" DATE column if it is missing;
--   * enforce one row per (period, "dateBucket") pair. Rows whose
--     "dateBucket" is NULL are not treated as duplicates of each other by
--     a default unique index.
DO $$
BEGIN
    IF to_regclass('"TrendAnalysis"') IS NOT NULL THEN
        ALTER TABLE "TrendAnalysis"
            ADD COLUMN IF NOT EXISTS "dateBucket" DATE;

        CREATE UNIQUE INDEX IF NOT EXISTS "TrendAnalysis_period_dateBucket_key"
            ON "TrendAnalysis" (period, "dateBucket");
    END IF;
END
$$;
-- "AppState": key/value store for application state (last crawl run time,
-- etc.). Each key maps to exactly one JSONB value; "updatedAt" defaults to
-- the insert time (millisecond precision, no time zone).
CREATE TABLE IF NOT EXISTS "AppState" (
    "key"       TEXT         PRIMARY KEY,
    "value"     JSONB        NOT NULL,
    "updatedAt" TIMESTAMP(3) NOT NULL DEFAULT CURRENT_TIMESTAMP
);
-- "CorrelationFinding": correlation findings (co-occurrence across sources).
-- The three array columns default to empty arrays rather than NULL.
CREATE TABLE IF NOT EXISTS "CorrelationFinding" (
    "id"            TEXT             NOT NULL DEFAULT gen_random_uuid(),
    "windowDays"    INTEGER          NOT NULL,
    "indicator"     TEXT             NOT NULL,
    "benchmark"     TEXT             NOT NULL,
    "metric"        TEXT,
    "avgDelta"      DOUBLE PRECISION,
    "maxDelta"      DOUBLE PRECISION,
    "analysisCount" INTEGER          NOT NULL,
    "sourceCount"   INTEGER          NOT NULL,
    "sources"       TEXT[]           NOT NULL DEFAULT '{}',
    "analysisIds"   TEXT[]           NOT NULL DEFAULT '{}',
    "urls"          TEXT[]           NOT NULL DEFAULT '{}',
    "createdAt"     TIMESTAMP(3)     NOT NULL DEFAULT CURRENT_TIMESTAMP,
    "updatedAt"     TIMESTAMP(3)     NOT NULL DEFAULT CURRENT_TIMESTAMP,

    CONSTRAINT "CorrelationFinding_pkey" PRIMARY KEY ("id")
);

-- One finding per ("windowDays", "indicator", "benchmark", "metric").
-- NOTE(review): "metric" is nullable and a default unique index treats
-- NULLs as distinct, so rows with a NULL metric are not deduplicated by
-- this index. Confirm whether that is intended.
CREATE UNIQUE INDEX IF NOT EXISTS "CorrelationFinding_window_indicator_benchmark_metric_key"
    ON "CorrelationFinding" ("windowDays", "indicator", "benchmark", "metric");

-- Non-unique index on the last-update timestamp.
CREATE INDEX IF NOT EXISTS "CorrelationFinding_updatedAt_idx"
    ON "CorrelationFinding" ("updatedAt");
-- "InsightFinding": LLM insights (natural interpretations across sources).
-- The three array columns default to empty arrays rather than NULL.
CREATE TABLE IF NOT EXISTS "InsightFinding" (
    "id"               TEXT             NOT NULL DEFAULT gen_random_uuid(),
    "windowDays"       INTEGER          NOT NULL,
    "title"            TEXT             NOT NULL,
    "summary"          TEXT             NOT NULL,
    "confidence"       DOUBLE PRECISION NOT NULL,
    "sources"          TEXT[]           NOT NULL DEFAULT '{}',
    "urls"             TEXT[]           NOT NULL DEFAULT '{}',
    "evidenceSnippets" TEXT[]           NOT NULL DEFAULT '{}',
    "createdAt"        TIMESTAMP(3)     NOT NULL DEFAULT CURRENT_TIMESTAMP,
    "updatedAt"        TIMESTAMP(3)     NOT NULL DEFAULT CURRENT_TIMESTAMP,

    CONSTRAINT "InsightFinding_pkey" PRIMARY KEY ("id")
);

-- A title may appear only once per "windowDays" value.
CREATE UNIQUE INDEX IF NOT EXISTS "InsightFinding_window_title_key"
    ON "InsightFinding" ("windowDays", "title");

-- Non-unique index on the last-update timestamp.
CREATE INDEX IF NOT EXISTS "InsightFinding_updatedAt_idx"
    ON "InsightFinding" ("updatedAt");
-- "AnalysisJob": tracking rows for analyze-all jobs.
-- The four counters start at 0, "startedAt" defaults to the insert time,
-- and "completedAt" is NULL until a value is written.
-- NOTE(review): "status" is free-form TEXT with no CHECK constraint; the
-- allowed values are not visible in this script.
CREATE TABLE IF NOT EXISTS "AnalysisJob" (
    "id"                     TEXT             NOT NULL DEFAULT gen_random_uuid(),
    "status"                 TEXT             NOT NULL,
    "totalArticles"          INTEGER          NOT NULL DEFAULT 0,
    "processedArticles"      INTEGER          NOT NULL DEFAULT 0,
    "successfulAnalyses"     INTEGER          NOT NULL DEFAULT 0,
    "failedAnalyses"         INTEGER          NOT NULL DEFAULT 0,
    "currentArticle"         TEXT,
    "avgBatchTime"           DOUBLE PRECISION,
    "estimatedTimeRemaining" DOUBLE PRECISION,
    "error"                  TEXT,
    "startedAt"              TIMESTAMP(3)     NOT NULL DEFAULT CURRENT_TIMESTAMP,
    "completedAt"            TIMESTAMP(3),

    CONSTRAINT "AnalysisJob_pkey" PRIMARY KEY ("id")
);

-- Non-unique index on the job start time.
CREATE INDEX IF NOT EXISTS "AnalysisJob_startedAt_idx"
    ON "AnalysisJob" ("startedAt");
-- "EvidenceClaim": evidence claims, each tied to a crawl via "crawlId".
-- "claim" and "evidence" are mandatory; the benchmark/metric/value/delta/
-- unit and URL columns may be NULL. "tags" and "numbers" default to empty
-- arrays.
-- NOTE(review): no foreign key from "crawlId" to "CrawlResult" is declared
-- in the visible part of this script. Confirm whether that is intended.
CREATE TABLE IF NOT EXISTS "EvidenceClaim" (
    "id"           TEXT               NOT NULL DEFAULT gen_random_uuid(),
    "crawlId"      TEXT               NOT NULL,
    "claim"        TEXT               NOT NULL,
    "evidence"     TEXT               NOT NULL,
    "benchmark"    TEXT,
    "metric"       TEXT,
    "value"        DOUBLE PRECISION,
    "delta"        DOUBLE PRECISION,
    "unit"         TEXT,
    "tags"         TEXT[]             NOT NULL DEFAULT '{}',
    "numbers"      DOUBLE PRECISION[] NOT NULL DEFAULT '{}',
    "url"          TEXT,
    "canonicalUrl" TEXT,
    "createdAt"    TIMESTAMP(3)       NOT NULL DEFAULT CURRENT_TIMESTAMP,

    CONSTRAINT "EvidenceClaim_pkey" PRIMARY KEY ("id")
);

-- The same claim text may be stored only once per crawl.
CREATE UNIQUE INDEX IF NOT EXISTS "EvidenceClaim_crawlId_claim_key"
    ON "EvidenceClaim" ("crawlId", "claim");

-- NOTE(review): "crawlId" is already the leading column of the unique
-- index above, so this index may be redundant. It is kept as-is.
CREATE INDEX IF NOT EXISTS "EvidenceClaim_crawlId_idx"
    ON "EvidenceClaim" ("crawlId");

-- Non-unique index on the benchmark name.
CREATE INDEX IF NOT EXISTS "EvidenceClaim_benchmark_idx"
    ON "EvidenceClaim" ("benchmark");
-- "AccuracyMetrics": accuracy metrics (evals snapshots).
-- Every count and rate column is mandatory; only "avgConfidence" and
-- "notes" may be NULL. "timestamp" defaults to the insert time.
CREATE TABLE IF NOT EXISTS "AccuracyMetrics" (
    "id"                TEXT             NOT NULL DEFAULT gen_random_uuid(),
    "period"            TEXT             NOT NULL,
    "timestamp"         TIMESTAMP(3)     NOT NULL DEFAULT CURRENT_TIMESTAMP,

    -- Raw counts.
    "truePositives"     INTEGER          NOT NULL,
    "falsePositives"    INTEGER          NOT NULL,
    "trueNegatives"     INTEGER          NOT NULL,
    "falseNegatives"    INTEGER          NOT NULL,

    -- Stored metric values; this script does not define how they are computed.
    "precision"         DOUBLE PRECISION NOT NULL,
    "recall"            DOUBLE PRECISION NOT NULL,
    "f1Score"           DOUBLE PRECISION NOT NULL,
    "accuracy"          DOUBLE PRECISION NOT NULL,
    "falsePositiveRate" DOUBLE PRECISION NOT NULL,
    "falseNegativeRate" DOUBLE PRECISION NOT NULL,

    "totalReviewed"     INTEGER          NOT NULL,
    "avgConfidence"     DOUBLE PRECISION,
    "notes"             TEXT,

    CONSTRAINT "AccuracyMetrics_pkey" PRIMARY KEY ("id")
);