summary | refs | log | tree | commit | diff
path: root/storage
diff options
context:
space:
mode:
author: Grail Finder <wohilas@gmail.com> 2024-12-31 13:25:13 +0300
committer: Grail Finder <wohilas@gmail.com> 2024-12-31 13:25:13 +0300
commit: 461d19aa2512fea7ac07e50c3178609850ef07c3 (patch)
tree: 1e317b813686ca7696e96bba766cdbd3aeb35138 /storage
parent: 4db8aea43dded3f2c1d0d41b5a3fb322a38d4730 (diff)
Feat: add rag [wip; skip-ci]
Diffstat (limited to 'storage')
-rw-r--r-- storage/migrate.go 5
-rw-r--r-- storage/migrations/002_add_vector.up.sql 6
-rw-r--r-- storage/storage.go 9
-rw-r--r-- storage/storage_test.go 88
-rw-r--r-- storage/vector.go 89
5 files changed, 196 insertions, 1 deletions
diff --git a/storage/migrate.go b/storage/migrate.go
index d97b99d..3c4ca21 100644
--- a/storage/migrate.go
+++ b/storage/migrate.go
@@ -5,6 +5,8 @@ import (
"fmt"
"io/fs"
"strings"
+
+ _ "github.com/asg017/sqlite-vec-go-bindings/ncruces"
)
//go:embed migrations/*
@@ -27,6 +29,7 @@ func (p *ProviderSQL) Migrate() {
err := p.executeMigration(migrationsDir, file.Name())
if err != nil {
p.logger.Error("Failed to execute migration %s: %v", file.Name(), err)
+ panic(err)
}
}
}
@@ -51,7 +54,7 @@ func (p *ProviderSQL) executeMigration(migrationsDir fs.FS, fileName string) err
func (p *ProviderSQL) executeSQL(sqlContent []byte) error {
// Connect to the database (example using a simple connection)
- _, err := p.db.Exec(string(sqlContent))
+ err := p.s3Conn.Exec(string(sqlContent))
if err != nil {
return fmt.Errorf("failed to execute SQL: %w", err)
}
diff --git a/storage/migrations/002_add_vector.up.sql b/storage/migrations/002_add_vector.up.sql
new file mode 100644
index 0000000..4fcc9aa
--- /dev/null
+++ b/storage/migrations/002_add_vector.up.sql
@@ -0,0 +1,6 @@
+-- Creates the embeddings virtual table (vec0 module) unless it already exists.
+-- Each row holds a 5120-float embedding plus its slug and raw text; the width
+-- is the same as the [5120]float32 query accepted by VectorRepo.SearchClosest.
+CREATE VIRTUAL TABLE IF NOT EXISTS embeddings USING vec0(
+ id INTEGER PRIMARY KEY AUTOINCREMENT,
+ embedding FLOAT[5120],
+ slug TEXT NOT NULL,
+ raw_text TEXT NOT NULL
+);
diff --git a/storage/storage.go b/storage/storage.go
index 0853328..cfaaf0a 100644
--- a/storage/storage.go
+++ b/storage/storage.go
@@ -6,11 +6,13 @@ import (
_ "github.com/glebarez/go-sqlite"
"github.com/jmoiron/sqlx"
+ "github.com/ncruces/go-sqlite3"
)
+// FullRepo is the combined storage interface: it embeds ChatHistory,
+// Memories and VectorRepo.
type FullRepo interface {
ChatHistory
Memories
+ VectorRepo
}
type ChatHistory interface {
@@ -25,6 +27,7 @@ type ChatHistory interface {
+// ProviderSQL holds the database handles and logger used by the storage
+// methods.
type ProviderSQL struct {
+// db is the sqlx handle that NewProviderSQL opens with the "sqlite" driver.
db *sqlx.DB
+// s3Conn is a second, direct sqlite3 connection that NewProviderSQL opens on
+// the same dbPath; migrations and the vector statements run through it.
+ s3Conn *sqlite3.Conn
logger *slog.Logger
}
@@ -87,6 +90,7 @@ func (p ProviderSQL) ChatGetMaxID() (uint32, error) {
return id, err
}
+// opens two connections
func NewProviderSQL(dbPath string, logger *slog.Logger) FullRepo {
db, err := sqlx.Open("sqlite", dbPath)
if err != nil {
@@ -94,6 +98,11 @@ func NewProviderSQL(dbPath string, logger *slog.Logger) FullRepo {
return nil
}
p := ProviderSQL{db: db, logger: logger}
+ p.s3Conn, err = sqlite3.Open(dbPath)
+ if err != nil {
+ logger.Error("failed to open vecdb connection", "error", err)
+ return nil
+ }
p.Migrate()
return p
}
diff --git a/storage/storage_test.go b/storage/storage_test.go
index 8373ab0..f6af4f5 100644
--- a/storage/storage_test.go
+++ b/storage/storage_test.go
@@ -3,13 +3,16 @@ package storage
import (
"elefant/models"
"fmt"
+ "log"
"log/slog"
"os"
"testing"
"time"
+ sqlite_vec "github.com/asg017/sqlite-vec-go-bindings/ncruces"
_ "github.com/glebarez/go-sqlite"
"github.com/jmoiron/sqlx"
+ "github.com/ncruces/go-sqlite3"
)
func TestMemories(t *testing.T) {
@@ -160,3 +163,88 @@ func TestChatHistory(t *testing.T) {
t.Errorf("Expected 0 chats, got %d", len(chats))
}
}
+
+// TestVecTable is a smoke test for the sqlite-vec extension on an in-memory
+// database: it checks that vec_version() is callable, creates a vec0 table,
+// inserts five 4-dimensional vectors and runs a nearest-neighbour query.
+// Every statement step, bind, reset and close is checked so that a failure
+// is reported instead of being silently skipped.
+func TestVecTable(t *testing.T) {
+	// healthcheck
+	db, err := sqlite3.Open(":memory:")
+	if err != nil {
+		t.Fatal(err)
+	}
+	stmt, _, err := db.Prepare(`SELECT sqlite_version(), vec_version()`)
+	if err != nil {
+		t.Fatal(err)
+	}
+	// Step reports false both on error and when there is no row; either way
+	// the columns below would be meaningless.
+	if !stmt.Step() {
+		t.Fatalf("version query returned no row: %v", stmt.Err())
+	}
+	log.Printf("sqlite_version=%s, vec_version=%s\n", stmt.ColumnText(0), stmt.ColumnText(1))
+	if err := stmt.Close(); err != nil {
+		t.Fatal(err)
+	}
+	// migration
+	err = db.Exec("CREATE VIRTUAL TABLE vec_items USING vec0(embedding float[4], chat_name TEXT NOT NULL)")
+	if err != nil {
+		t.Fatal(err)
+	}
+	// data prep and insert
+	items := map[int][]float32{
+		1: {0.1, 0.1, 0.1, 0.1},
+		2: {0.2, 0.2, 0.2, 0.2},
+		3: {0.3, 0.3, 0.3, 0.3},
+		4: {0.4, 0.4, 0.4, 0.4},
+		5: {0.5, 0.5, 0.5, 0.5},
+	}
+	q := []float32{0.28, 0.3, 0.3, 0.3}
+	stmt, _, err = db.Prepare("INSERT INTO vec_items(rowid, embedding, chat_name) VALUES (?, ?, ?)")
+	if err != nil {
+		t.Fatal(err)
+	}
+	for id, values := range items {
+		v, err := sqlite_vec.SerializeFloat32(values)
+		if err != nil {
+			t.Fatal(err)
+		}
+		if err := stmt.BindInt(1, id); err != nil {
+			t.Fatal(err)
+		}
+		if err := stmt.BindBlob(2, v); err != nil {
+			t.Fatal(err)
+		}
+		if err := stmt.BindText(3, "some_chat"); err != nil {
+			t.Fatal(err)
+		}
+		if err := stmt.Exec(); err != nil {
+			t.Fatal(err)
+		}
+		if err := stmt.Reset(); err != nil {
+			t.Fatal(err)
+		}
+	}
+	if err := stmt.Close(); err != nil {
+		t.Fatal(err)
+	}
+	// select | vec search
+	stmt, _, err = db.Prepare(`
+		SELECT
+			rowid,
+			distance,
+			embedding
+		FROM vec_items
+		WHERE embedding MATCH ?
+		ORDER BY distance
+		LIMIT 3
+	`)
+	if err != nil {
+		t.Fatal(err)
+	}
+	query, err := sqlite_vec.SerializeFloat32(q)
+	if err != nil {
+		t.Fatal(err)
+	}
+	if err := stmt.BindBlob(1, query); err != nil {
+		t.Fatal(err)
+	}
+	for stmt.Step() {
+		rowid := stmt.ColumnInt64(0)
+		distance := stmt.ColumnFloat(1)
+		// The raw bytes are only used within this iteration, before the
+		// next Step, so decoding them in place is acceptable here.
+		emb := stmt.ColumnRawText(2)
+		floats := decodeUnsafe(emb)
+		log.Printf("rowid=%d, distance=%f, floats=%v\n", rowid, distance, floats)
+	}
+	if err := stmt.Err(); err != nil {
+		t.Fatal(err)
+	}
+	err = stmt.Close()
+	if err != nil {
+		t.Fatal(err)
+	}
+	err = db.Close()
+	if err != nil {
+		t.Fatal(err)
+	}
+}
diff --git a/storage/vector.go b/storage/vector.go
new file mode 100644
index 0000000..bc46734
--- /dev/null
+++ b/storage/vector.go
@@ -0,0 +1,89 @@
+package storage
+
+import (
+ "elefant/models"
+ "fmt"
+ "log"
+ "unsafe"
+
+ sqlite_vec "github.com/asg017/sqlite-vec-go-bindings/ncruces"
+)
+
+// VectorRepo is the storage interface for embedding vectors.
+type VectorRepo interface {
+ // WriteVector persists the given row and reports any failure.
+ WriteVector(*models.VectorRow) error
+ // SearchClosest is the nearest-neighbour lookup for a 5120-dimensional
+ // query vector q.
+ // NOTE(review): the result for "nothing stored / nothing matched" is not
+ // defined by this interface — confirm the intended contract.
+ SearchClosest(q [5120]float32) (*models.VectorRow, error)
+}
+
+// vecTableName is the table WriteVector inserts into; the name matches the
+// virtual table created by migrations/002_add_vector.up.sql.
+var vecTableName = "embeddings"
+
+// WriteVector inserts row's embedding, slug and raw text into the
+// vecTableName table through the sqlite3 connection.
+//
+// row.ID is not written: the INSERT names only the embedding, slug and
+// raw_text columns, so exactly three parameters are bound, in that order.
+// Any prepare, serialize, bind or exec failure is logged and returned.
+func (p ProviderSQL) WriteVector(row *models.VectorRow) error {
+	stmt, _, err := p.s3Conn.Prepare(
+		fmt.Sprintf("INSERT INTO %s(embedding, slug, raw_text) VALUES (?, ?, ?)", vecTableName))
+	if err != nil {
+		p.logger.Error("failed to prep a stmt", "error", err)
+		return err
+	}
+	// Register the cleanup only once the statement is known to be valid.
+	defer stmt.Close()
+	v, err := sqlite_vec.SerializeFloat32(row.Embeddings)
+	if err != nil {
+		p.logger.Error("failed to serialize vector",
+			"emb-len", len(row.Embeddings), "error", err)
+		return err
+	}
+	// Parameter indexes are 1-based and must line up with the placeholders:
+	// 1 = embedding, 2 = slug, 3 = raw_text.
+	err = stmt.BindBlob(1, v)
+	if err == nil {
+		err = stmt.BindText(2, row.Slug)
+	}
+	if err == nil {
+		err = stmt.BindText(3, row.RawText)
+	}
+	if err != nil {
+		p.logger.Error("failed to bind stmt params", "error", err)
+		return err
+	}
+	err = stmt.Exec()
+	if err != nil {
+		p.logger.Error("failed exec a stmt", "error", err)
+		return err
+	}
+	return nil
+}
+
+// decodeUnsafe reinterprets bs as a slice of float32 values without copying.
+// The result has len(bs)/4 elements (trailing bytes that do not fill a whole
+// float32 are ignored) and shares memory with bs, so it is only valid for as
+// long as bs is. Input shorter than four bytes yields nil instead of
+// panicking on &bs[0].
+func decodeUnsafe(bs []byte) []float32 {
+	n := len(bs) / 4
+	if n == 0 {
+		return nil
+	}
+	return unsafe.Slice((*float32)(unsafe.Pointer(&bs[0])), n)
+}
+
+// SearchClosest returns the row of the vecTableName table whose embedding is
+// nearest to q, as ordered by the distance column of the MATCH query.
+//
+// It returns (nil, nil) when the query yields no row. Prepare, serialize,
+// bind and step failures are returned to the caller rather than terminating
+// the process.
+func (p ProviderSQL) SearchClosest(q [5120]float32) (*models.VectorRow, error) {
+	// Only the single nearest row is returned, so only one is requested.
+	stmt, _, err := p.s3Conn.Prepare(fmt.Sprintf(`
+		SELECT
+			id,
+			distance,
+			embedding,
+			slug,
+			raw_text
+		FROM %s
+		WHERE embedding MATCH ?
+		ORDER BY distance
+		LIMIT 1
+	`, vecTableName))
+	if err != nil {
+		return nil, fmt.Errorf("preparing closest-vector query: %w", err)
+	}
+	defer func() {
+		// The primary error (if any) is already on its way to the caller;
+		// a failure to finalize the statement is only reported.
+		if cerr := stmt.Close(); cerr != nil {
+			log.Printf("closing closest-vector statement: %v", cerr)
+		}
+	}()
+	query, err := sqlite_vec.SerializeFloat32(q[:])
+	if err != nil {
+		return nil, fmt.Errorf("serializing query vector: %w", err)
+	}
+	if err := stmt.BindBlob(1, query); err != nil {
+		return nil, fmt.Errorf("binding query vector: %w", err)
+	}
+	if !stmt.Step() {
+		// Step reports false both on error and on an empty result set.
+		if err := stmt.Err(); err != nil {
+			return nil, fmt.Errorf("running closest-vector query: %w", err)
+		}
+		return nil, nil
+	}
+	// The raw column bytes belong to SQLite and may be invalidated by later
+	// statement calls, so copy them before reading anything else.
+	raw := stmt.ColumnRawText(2)
+	owned := make([]byte, len(raw))
+	copy(owned, raw)
+	row := &models.VectorRow{
+		ID:       uint32(stmt.ColumnInt64(0)),
+		Distance: float32(stmt.ColumnFloat(1)),
+		Slug:     stmt.ColumnText(3),
+		RawText:  stmt.ColumnText(4),
+	}
+	// Guard against an empty blob before reinterpreting it as float32s.
+	if len(owned) >= 4 {
+		row.Embeddings = decodeUnsafe(owned)
+	}
+	return row, nil
+}