fix: Fix OpenAI batch embedding

This commit is contained in:
Hwang In Tak 2024-09-26 20:39:40 +09:00
parent be41994d40
commit a4bc0b2829
No known key found for this signature in database
3 changed files with 3 additions and 7 deletions

View File

@ -1112,13 +1112,15 @@ def store_docs_in_vector_db(
app.state.config.RAG_EMBEDDING_OPENAI_BATCH_SIZE, app.state.config.RAG_EMBEDDING_OPENAI_BATCH_SIZE,
) )
embedding_texts = list(map(lambda x: x.replace("\n", " "), texts))
VECTOR_DB_CLIENT.insert( VECTOR_DB_CLIENT.insert(
collection_name=collection_name, collection_name=collection_name,
items=[ items=[
{ {
"id": str(uuid.uuid4()), "id": str(uuid.uuid4()),
"text": text, "text": text,
"vector": embedding_function(text.replace("\n", " ")), "vector": embedding_texts[idx],
"metadata": metadatas[idx], "metadata": metadatas[idx],
} }
for idx, text in enumerate(texts) for idx, text in enumerate(texts)

View File

@ -76,8 +76,6 @@ def query_doc(
limit=k, limit=k,
) )
print("result", result)
log.info(f"query_doc:result {result}") log.info(f"query_doc:result {result}")
return result return result
except Exception as e: except Exception as e:

View File

@ -16,8 +16,6 @@ class MilvusClient:
self.client = Client(uri=MILVUS_URI) self.client = Client(uri=MILVUS_URI)
def _result_to_get_result(self, result) -> GetResult: def _result_to_get_result(self, result) -> GetResult:
print(result)
ids = [] ids = []
documents = [] documents = []
metadatas = [] metadatas = []
@ -45,8 +43,6 @@ class MilvusClient:
) )
def _result_to_search_result(self, result) -> SearchResult: def _result_to_search_result(self, result) -> SearchResult:
print(result)
ids = [] ids = []
distances = [] distances = []
documents = [] documents = []