Spaces:

retopara
/

ragflow

Build error

Kevin Hu committed on Aug 13, 2024

Commit

2118d99

1 Parent(s): 91751af

boost parallelism of graphrag (#1924)

### What problem does this PR solve?

### Type of change

- [x] Performance Improvement

Files changed (1) hide show

graphrag/index.py CHANGED Viewed

@@ -61,11 +61,11 @@ def build_knowlege_graph_chunks(tenant_id: str, chunks: List[str], callback, ent
     assert left_token_count > 0, f"The LLM context length({llm_bdl.max_length}) is smaller than prompt({ext.prompt_token_count})"
-    BATCH_SIZE=1
     texts, graphs = [], []
     cnt = 0
     threads = []
-    exe = ThreadPoolExecutor(max_workers=12)
     for i in range(len(chunks)):
         tkn_cnt = num_tokens_from_string(chunks[i])
         if cnt+tkn_cnt >= left_token_count and texts:

     assert left_token_count > 0, f"The LLM context length({llm_bdl.max_length}) is smaller than prompt({ext.prompt_token_count})"
+    BATCH_SIZE=4
     texts, graphs = [], []
     cnt = 0
     threads = []
+    exe = ThreadPoolExecutor(max_workers=50)
     for i in range(len(chunks)):
         tkn_cnt = num_tokens_from_string(chunks[i])
         if cnt+tkn_cnt >= left_token_count and texts: