buster / embed_documents.py
jerpint's picture
add markdown parser (#5)
01b468b unverified
raw
history blame
No virus
430 Bytes
import pandas as pd
from buster.documents_manager import DeepLakeDocumentsManager
if __name__ == "__main__":
    # Script entry point: load the chunk CSV, add its rows to a DeepLake
    # documents manager, then zip the result and report where it was written.
    source_csv = "langchain_course.csv"
    store_location = "deeplake_store"

    # The CSV is read before the manager is constructed, so an unreadable
    # file raises before DeepLakeDocumentsManager is ever called.
    chunks = pd.read_csv(source_csv)

    # overwrite=True is passed straight to the manager; presumably it replaces
    # any store already at that path -- confirm against DeepLakeDocumentsManager.
    manager = DeepLakeDocumentsManager(store_location, overwrite=True)
    manager.batch_add(chunks)

    # to_zip() returns the value printed below as the archive location.
    zipped_file_path = manager.to_zip()
    print(f"Contents zipped to: {zipped_file_path}")