Commit 9bda030e authored by jyong

Merge branch 'feat/milvus-support' into deploy/dev

parents 76569834 37f5bb3d
...@@ -496,8 +496,9 @@ class IndexingRunner: ...@@ -496,8 +496,9 @@ class IndexingRunner:
# parse document to nodes # parse document to nodes
documents = splitter.split_documents([text_doc]) documents = splitter.split_documents([text_doc])
split_documents = []
def format_document(flask_app: Flask, document_node: Document, split_documents: List) -> List[Document]: def format_document(flask_app: Flask, document_node: Document) -> List[Document]:
with flask_app.app_context(): with flask_app.app_context():
print("process:"+document_node.page_content) print("process:"+document_node.page_content)
format_documents = [] format_documents = []
...@@ -528,20 +529,19 @@ class IndexingRunner: ...@@ -528,20 +529,19 @@ class IndexingRunner:
qa_documents.append(qa_document) qa_documents.append(qa_document)
format_documents.extend(qa_documents) format_documents.extend(qa_documents)
split_documents.append(format_documents) return format_documents
split_documents = [] # threads = []
threads = [] # for doc in documents:
for doc in documents: # document_format_thread = threading.Thread(target=format_document, kwargs={
document_format_thread = threading.Thread(target=format_document, kwargs={ # 'flask_app': current_app._get_current_object(), 'document_node': doc, 'split_documents': split_documents})
'flask_app': current_app._get_current_object(), 'document_node': doc, 'split_documents': split_documents}) # threads.append(document_format_thread)
threads.append(document_format_thread) # document_format_thread.start()
document_format_thread.start() # for thread in threads:
for thread in threads: # thread.join()
thread.join() with ThreadPoolExecutor(max_workers=10) as executor:
# with ThreadPoolExecutor() as executor: future_to_doc = {executor.submit(format_document, current_app._get_current_object(), doc): doc for doc in documents}
# future_to_doc = {executor.submit(format_document, current_app._get_current_object(), doc): doc for doc in documents} for future in concurrent.futures.as_completed(future_to_doc):
# for future in concurrent.futures.as_completed(future_to_doc): split_documents.extend(future.result())
# split_documents.extend(future.result())
all_documents.extend(split_documents) all_documents.extend(split_documents)
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment