yungongzi OnePieceMan committed on
Commit
d7bf446
·
1 Parent(s): 6cb617c

Added support for Baichuan LLM (#934)

Browse files

### What problem does this PR solve?

- Added support for Baichuan LLM

### Type of change

- [x] New Feature (non-breaking change which adds functionality)

Co-authored-by: 海贼宅 <[email protected]>

api/db/init_data.py CHANGED
@@ -137,7 +137,12 @@ factory_infos = [{
137
  "logo": "",
138
  "tags": "LLM, TEXT EMBEDDING",
139
  "status": "1",
140
- }
 
 
 
 
 
141
  # {
142
  # "name": "文心一言",
143
  # "logo": "",
@@ -392,6 +397,49 @@ def init_llm_factory():
392
  "max_tokens": 4096,
393
  "model_type": LLMType.CHAT.value
394
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
395
  ]
396
  for info in factory_infos:
397
  try:
 
137
  "logo": "",
138
  "tags": "LLM, TEXT EMBEDDING",
139
  "status": "1",
140
+ },{
141
+ "name": "BaiChuan",
142
+ "logo": "",
143
+ "tags": "LLM,TEXT EMBEDDING",
144
+ "status": "1",
145
+ },
146
  # {
147
  # "name": "文心一言",
148
  # "logo": "",
 
397
  "max_tokens": 4096,
398
  "model_type": LLMType.CHAT.value
399
  },
400
+ # ------------------------ BaiChuan -----------------------
401
+ {
402
+ "fid": factory_infos[10]["name"],
403
+ "llm_name": "Baichuan2-Turbo",
404
+ "tags": "LLM,CHAT,32K",
405
+ "max_tokens": 32768,
406
+ "model_type": LLMType.CHAT.value
407
+ },
408
+ {
409
+ "fid": factory_infos[10]["name"],
410
+ "llm_name": "Baichuan2-Turbo-192k",
411
+ "tags": "LLM,CHAT,192K",
412
+ "max_tokens": 196608,
413
+ "model_type": LLMType.CHAT.value
414
+ },
415
+ {
416
+ "fid": factory_infos[10]["name"],
417
+ "llm_name": "Baichuan3-Turbo",
418
+ "tags": "LLM,CHAT,32K",
419
+ "max_tokens": 32768,
420
+ "model_type": LLMType.CHAT.value
421
+ },
422
+ {
423
+ "fid": factory_infos[10]["name"],
424
+ "llm_name": "Baichuan3-Turbo-128k",
425
+ "tags": "LLM,CHAT,128K",
426
+ "max_tokens": 131072,
427
+ "model_type": LLMType.CHAT.value
428
+ },
429
+ {
430
+ "fid": factory_infos[10]["name"],
431
+ "llm_name": "Baichuan4",
432
+ "tags": "LLM,CHAT,128K",
433
+ "max_tokens": 131072,
434
+ "model_type": LLMType.CHAT.value
435
+ },
436
+ {
437
+ "fid": factory_infos[10]["name"],
438
+ "llm_name": "Baichuan-Text-Embedding",
439
+ "tags": "TEXT EMBEDDING",
440
+ "max_tokens": 512,
441
+ "model_type": LLMType.EMBEDDING.value
442
+ },
443
  ]
444
  for info in factory_infos:
445
  try:
rag/llm/__init__.py CHANGED
@@ -26,7 +26,8 @@ EmbeddingModel = {
26
  "ZHIPU-AI": ZhipuEmbed,
27
  "FastEmbed": FastEmbed,
28
  "Youdao": YoudaoEmbed,
29
- "DeepSeek": DefaultEmbedding
 
30
  }
31
 
32
 
@@ -47,6 +48,7 @@ ChatModel = {
47
  "Ollama": OllamaChat,
48
  "Xinference": XinferenceChat,
49
  "Moonshot": MoonshotChat,
50
- "DeepSeek": DeepSeekChat
 
51
  }
52
 
 
26
  "ZHIPU-AI": ZhipuEmbed,
27
  "FastEmbed": FastEmbed,
28
  "Youdao": YoudaoEmbed,
29
+ "DeepSeek": DefaultEmbedding,
30
+ "BaiChuan": BaiChuanEmbed
31
  }
32
 
33
 
 
48
  "Ollama": OllamaChat,
49
  "Xinference": XinferenceChat,
50
  "Moonshot": MoonshotChat,
51
+ "DeepSeek": DeepSeekChat,
52
+ "BaiChuan": BaiChuanChat
53
  }
54
 
rag/llm/chat_model.py CHANGED
@@ -95,6 +95,84 @@ class DeepSeekChat(Base):
95
  super().__init__(key, model_name, base_url)
96
 
97
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
98
  class QWenChat(Base):
99
  def __init__(self, key, model_name=Generation.Models.qwen_turbo, **kwargs):
100
  import dashscope
 
95
  super().__init__(key, model_name, base_url)
96
 
97
 
98
+ class BaiChuanChat(Base):
99
+ def __init__(self, key, model_name="Baichuan3-Turbo", base_url="https://api.baichuan-ai.com/v1"):
100
+ if not base_url:
101
+ base_url = "https://api.baichuan-ai.com/v1"
102
+ super().__init__(key, model_name, base_url)
103
+
104
+ @staticmethod
105
+ def _format_params(params):
106
+ return {
107
+ "temperature": params.get("temperature", 0.3),
108
+ "max_tokens": params.get("max_tokens", 2048),
109
+ "top_p": params.get("top_p", 0.85),
110
+ }
111
+
112
+ def chat(self, system, history, gen_conf):
113
+ if system:
114
+ history.insert(0, {"role": "system", "content": system})
115
+ try:
116
+ response = self.client.chat.completions.create(
117
+ model=self.model_name,
118
+ messages=history,
119
+ extra_body={
120
+ "tools": [{
121
+ "type": "web_search",
122
+ "web_search": {
123
+ "enable": True,
124
+ "search_mode": "performance_first"
125
+ }
126
+ }]
127
+ },
128
+ **self._format_params(gen_conf))
129
+ ans = response.choices[0].message.content.strip()
130
+ if response.choices[0].finish_reason == "length":
131
+ ans += "...\nFor the content length reason, it stopped, continue?" if is_english(
132
+ [ans]) else "······\n由于长度的原因,回答被截断了,要继续吗?"
133
+ return ans, response.usage.total_tokens
134
+ except openai.APIError as e:
135
+ return "**ERROR**: " + str(e), 0
136
+
137
+ def chat_streamly(self, system, history, gen_conf):
138
+ if system:
139
+ history.insert(0, {"role": "system", "content": system})
140
+ ans = ""
141
+ total_tokens = 0
142
+ try:
143
+ response = self.client.chat.completions.create(
144
+ model=self.model_name,
145
+ messages=history,
146
+ extra_body={
147
+ "tools": [{
148
+ "type": "web_search",
149
+ "web_search": {
150
+ "enable": True,
151
+ "search_mode": "performance_first"
152
+ }
153
+ }]
154
+ },
155
+ stream=True,
156
+ **self._format_params(gen_conf))
157
+ for resp in response:
158
+ if resp.choices[0].finish_reason == "stop":
159
+ if not resp.choices[0].delta.content:
160
+ continue
161
+ total_tokens = resp.usage.get('total_tokens', 0)
162
+ if not resp.choices[0].delta.content:
163
+ continue
164
+ ans += resp.choices[0].delta.content
165
+ if resp.choices[0].finish_reason == "length":
166
+ ans += "...\nFor the content length reason, it stopped, continue?" if is_english(
167
+ [ans]) else "······\n由于长度的原因,回答被截断了,要继续吗?"
168
+ yield ans
169
+
170
+ except Exception as e:
171
+ yield ans + "\n**ERROR**: " + str(e)
172
+
173
+ yield total_tokens
174
+
175
+
176
  class QWenChat(Base):
177
  def __init__(self, key, model_name=Generation.Models.qwen_turbo, **kwargs):
178
  import dashscope
rag/llm/embedding_model.py CHANGED
@@ -104,6 +104,15 @@ class OpenAIEmbed(Base):
104
  return np.array(res.data[0].embedding), res.usage.total_tokens
105
 
106
 
 
 
 
 
 
 
 
 
 
107
  class QWenEmbed(Base):
108
  def __init__(self, key, model_name="text_embedding_v2", **kwargs):
109
  dashscope.api_key = key
 
104
  return np.array(res.data[0].embedding), res.usage.total_tokens
105
 
106
 
107
class BaiChuanEmbed(OpenAIEmbed):
    """Embedding client for Baichuan's OpenAI-compatible endpoint.

    Baichuan serves embeddings through an OpenAI-style API, so all request
    logic is inherited from ``OpenAIEmbed``; only the defaults differ.
    """

    def __init__(self, key,
                 model_name='Baichuan-Text-Embedding',
                 base_url='https://api.baichuan-ai.com/v1'):
        # An explicitly falsy base_url (None/"") still resolves to the default.
        super().__init__(key, model_name, base_url or "https://api.baichuan-ai.com/v1")
114
+
115
+
116
  class QWenEmbed(Base):
117
  def __init__(self, key, model_name="text_embedding_v2", **kwargs):
118
  dashscope.api_key = key
web/src/assets/svg/llm/baichuan.svg ADDED
web/src/pages/user-setting/setting-model/index.tsx CHANGED
@@ -55,6 +55,7 @@ const IconMap = {
55
  Xinference: 'xinference',
56
  DeepSeek: 'deepseek',
57
  VolcEngine: 'volc_engine',
 
58
  };
59
 
60
  const LlmIcon = ({ name }: { name: string }) => {
 
55
  Xinference: 'xinference',
56
  DeepSeek: 'deepseek',
57
  VolcEngine: 'volc_engine',
58
+ BaiChuan: 'baichuan',
59
  };
60
 
61
  const LlmIcon = ({ name }: { name: string }) => {