20 lines
553 B
Python
20 lines
553 B
Python
from langchain_chroma import Chroma
|
|
import os
|
|
|
|
|
|
def create_vectorstore(docs_split: list, embeddings, file_name: str):
    """Build a Chroma vector store for a document, persisted under ``embeddings/``.

    The persistence directory is derived from ``file_name``: the name is
    lower-cased, a trailing ``.pdf`` extension (in any letter case) is
    removed, and spaces are replaced by underscores.

    Args:
        docs_split: The document chunks handed to ``Chroma.from_documents``.
        embeddings: The embedding object handed to ``Chroma.from_documents``.
        file_name: Name of the source file, e.g. ``"My Report.pdf"``.

    Returns:
        The object returned by ``Chroma.from_documents``.
    """
    pdf_suffix = ".pdf"

    # Lower-case first so that ".PDF" / ".Pdf" are recognised as the
    # extension, and strip it only at the end of the name so that a ".pdf"
    # occurring in the middle of the name is left alone.
    db_name = file_name.lower()
    if db_name.endswith(pdf_suffix):
        db_name = db_name[: -len(pdf_suffix)]
    db_name = db_name.replace(" ", "_")

    persist_directory = f"embeddings/{db_name}"

    # Create the directory if it does not exist yet.
    os.makedirs(persist_directory, exist_ok=True)

    # Always create/update the vector store.
    # NOTE(review): calling this repeatedly for the same file presumably adds
    # the same documents to the existing persisted collection again -- confirm
    # whether de-duplication is needed.
    return Chroma.from_documents(
        persist_directory=persist_directory,
        documents=docs_split,
        embedding=embeddings,
    )
|