Spaces:

retopara
/

ragflow

Build error

KevinHuSh commited on Mar 27, 2024

Commit

adb65d7

1 Parent(s): f6d3d52

refine OpenAi Api (#159)

Files changed (5) hide show

README.md CHANGED Viewed

@@ -127,7 +127,7 @@ Open your browser, enter the IP address of your server, _**Hallelujah**_ again!
 # System Architecture Diagram
 <div align="center" style="margin-top:20px;margin-bottom:20px;">
-<img src="https://github.com/infiniflow/ragflow/assets/12318111/39c8e546-51ca-4b50-a1da-83731b540cd0" width="1000"/>
 </div>
 # Configuration

 # System Architecture Diagram
 <div align="center" style="margin-top:20px;margin-bottom:20px;">
+<img src="https://github.com/infiniflow/ragflow/assets/12318111/d6ac5664-c237-4200-a7c2-a4a00691b485" width="1000"/>
 </div>
 # Configuration

api/apps/llm_app.py CHANGED Viewed

@@ -51,7 +51,7 @@ def set_api_key():
                 if len(arr[0]) == 0 or tc == 0:
                     raise Exception("Fail")
             except Exception as e:
-                msg += f"\nFail to access embedding model({llm.llm_name}) using this api key."
         elif not chat_passed and llm.model_type == LLMType.CHAT.value:
             mdl = ChatModel[factory](
                 req["api_key"], llm.llm_name)

                 if len(arr[0]) == 0 or tc == 0:
                     raise Exception("Fail")
             except Exception as e:
+                msg += f"\nFail to access embedding model({llm.llm_name}) using this api key." + str(e)
         elif not chat_passed and llm.model_type == LLMType.CHAT.value:
             mdl = ChatModel[factory](
                 req["api_key"], llm.llm_name)

rag/app/picture.py CHANGED Viewed

@@ -29,7 +29,7 @@ def chunk(filename, binary, tenant_id, lang, callback=None, **kwargs):
     except Exception as e:
         callback(prog=-1, msg=str(e))
         return []
-    img = Image.open(io.BytesIO(binary))
     doc = {
         "docnm_kwd": filename,
         "image": img

     except Exception as e:
         callback(prog=-1, msg=str(e))
         return []
+    img = Image.open(io.BytesIO(binary)).convert('RGB')
     doc = {
         "docnm_kwd": filename,
         "image": img

rag/llm/chat_model.py CHANGED Viewed

@@ -43,8 +43,8 @@ class GptTurbo(Base):
                 model=self.model_name,
                 messages=history,
                 **gen_conf)
-            ans = response.output.choices[0]['message']['content'].strip()
-            if response.output.choices[0].get("finish_reason", "") == "length":
                 ans += "...\nFor the content length reason, it stopped, continue?" if is_english(
                     [ans]) else "······\n由于长度的原因，回答被截断了，要继续吗？"
             return ans, response.usage.completion_tokens
@@ -114,12 +114,12 @@ class ZhipuChat(Base):
             history.insert(0, {"role": "system", "content": system})
         try:
             response = self.client.chat.completions.create(
-                self.model_name,
                 messages=history,
                 **gen_conf
             )
-            ans = response.output.choices[0]['message']['content'].strip()
-            if response.output.choices[0].get("finish_reason", "") == "length":
                 ans += "...\nFor the content length reason, it stopped, continue?" if is_english(
                     [ans]) else "······\n由于长度的原因，回答被截断了，要继续吗？"
             return ans, response.usage.completion_tokens

                 model=self.model_name,
                 messages=history,
                 **gen_conf)
+            ans = response.choices[0].message.content.strip()
+            if response.choices[0].finish_reason == "length":
                 ans += "...\nFor the content length reason, it stopped, continue?" if is_english(
                     [ans]) else "······\n由于长度的原因，回答被截断了，要继续吗？"
             return ans, response.usage.completion_tokens
             history.insert(0, {"role": "system", "content": system})
         try:
             response = self.client.chat.completions.create(
+                model=self.model_name,
                 messages=history,
                 **gen_conf
             )
+            ans = response.choices[0].message.content.strip()
+            if response.choices[0].finish_reason == "length":
                 ans += "...\nFor the content length reason, it stopped, continue?" if is_english(
                     [ans]) else "······\n由于长度的原因，回答被截断了，要继续吗？"
             return ans, response.usage.completion_tokens

rag/llm/embedding_model.py CHANGED Viewed

@@ -139,12 +139,16 @@ class ZhipuEmbed(Base):
         self.model_name = model_name
     def encode(self, texts: list, batch_size=32):
-        res = self.client.embeddings.create(input=texts,
                                             model=self.model_name)
-        return np.array([d.embedding for d in res.data]
-                        ), res.usage.total_tokens
     def encode_queries(self, text):
         res = self.client.embeddings.create(input=text,
                                             model=self.model_name)
-        return np.array(res["data"][0]["embedding"]), res.usage.total_tokens

         self.model_name = model_name
     def encode(self, texts: list, batch_size=32):
+        arr = []
+        tks_num = 0
+        for txt in texts:
+            res = self.client.embeddings.create(input=txt,
                                             model=self.model_name)
+            arr.append(res.data[0].embedding)
+            tks_num += res.usage.total_tokens
+        return np.array(arr), tks_num
     def encode_queries(self, text):
         res = self.client.embeddings.create(input=text,
                                             model=self.model_name)
+        return np.array(res.data[0].embedding), res.usage.total_tokens