mirror of
https://github.com/asg017/sqlite-vec.git
synced 2026-04-25 16:56:27 +02:00
17 lines
374 B
Python
17 lines
374 B
Python
|
|
import numpy as np
|
||
|
|
import duckdb
|
||
|
|
# Throwaway in-memory DuckDB database; nothing is persisted on the DuckDB side.
db = duckdb.connect(":memory:")

# Only the embedding column is selected (cast to float[]); the other columns
# are left commented out inside the query text.
query = """
select
-- _id,
-- title,
-- text as contents,
embedding::float[] as embeddings
from "hf://datasets/Supabase/dbpedia-openai-3-large-1M/dbpedia_openai_3_large_00.parquet"
"""

# Run the query, fetch the result as numpy data, and pick out the column
# by its alias.
columns = db.execute(query).fetchnumpy()
result = columns['embeddings']

# Stack the per-row embeddings vertically into one array and write it to disk.
stacked = np.vstack(result)
np.save("dbpedia_openai_3_large_00.npy", stacked)
|