Spaces:
Sleeping
Sleeping
File size: 1,044 Bytes
e37fa39 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 |
from langchain_community.embeddings import HuggingFaceEmbeddings
from loader import load_and_split_markdown
# from langchain.vectorstores import FAISS
from langchain_community.vectorstores import FAISS
from langchain_community.vectorstores.utils import DistanceStrategy
from huggingface_hub.utils import disable_progress_bars
disable_progress_bars() # Disable download progress bars
def get_retriever(
    name: str = 'intfloat/multilingual-e5-large',
    *,
    device: str = "cpu",
    batch_size: int = 4,
) -> "tuple[HuggingFaceEmbeddings, FAISS]":
    """Build the embedding model and a FAISS vector store over the markdown docs.

    The documents come from ``load_and_split_markdown()`` and are embedded
    and indexed on every call; nothing is cached between calls.

    Args:
        name: Model identifier passed to ``HuggingFaceEmbeddings`` as
            ``model_name``.
        device: Device string forwarded to the model via ``model_kwargs``.
            Defaults to ``"cpu"``.
        batch_size: Encoding batch size forwarded via ``encode_kwargs``.
            The default of 4 is deliberately small for CPU encoding.

    Returns:
        A ``(embedding_model, vector_store)`` tuple, where ``vector_store``
        is the FAISS store created with ``DistanceStrategy.COSINE``.
    """
    # multi_process is intentionally not used (removed for Windows).
    embedding_model = HuggingFaceEmbeddings(
        model_name=name,
        model_kwargs={"device": device},
        encode_kwargs={
            "normalize_embeddings": True,
            "batch_size": batch_size,
        },
    )

    docs_processed = load_and_split_markdown()

    knowledge_vector_database = FAISS.from_documents(
        documents=docs_processed,
        embedding=embedding_model,
        distance_strategy=DistanceStrategy.COSINE,
    )
    return embedding_model, knowledge_vector_database