黄腾 aopstudio Kevin Hu committed on
Commit
6f1cd9e
1 Parent(s): 24ab7dc

add support for Anthropic (#2148)

Browse files

### What problem does this PR solve?

#1853 add support for Anthropic

### Type of change

- [x] New Feature (non-breaking change which adds functionality)

---------

Co-authored-by: Zhedong Cen <[email protected]>
Co-authored-by: Kevin Hu <[email protected]>

conf/llm_factories.json CHANGED
@@ -3240,6 +3240,56 @@
3240
  "tags": "SPEECH2TEXT",
3241
  "status": "1",
3242
  "llm": []
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3243
  }
3244
  ]
3245
  }
 
3240
  "tags": "SPEECH2TEXT",
3241
  "status": "1",
3242
  "llm": []
3243
+ },
3244
+ {
3245
+ "name": "Anthropic",
3246
+ "logo": "",
3247
+ "tags": "LLM",
3248
+ "status": "1",
3249
+ "llm": [
3250
+ {
3251
+ "llm_name": "claude-3-5-sonnet-20240620",
3252
+ "tags": "LLM,CHAT,200k",
3253
+ "max_tokens": 204800,
3254
+ "model_type": "chat"
3255
+ },
3256
+ {
3257
+ "llm_name": "claude-3-opus-20240229",
3258
+ "tags": "LLM,CHAT,200k",
3259
+ "max_tokens": 204800,
3260
+ "model_type": "chat"
3261
+ },
3262
+ {
3263
+ "llm_name": "claude-3-sonnet-20240229",
3264
+ "tags": "LLM,CHAT,200k",
3265
+ "max_tokens": 204800,
3266
+ "model_type": "chat"
3267
+ },
3268
+ {
3269
+ "llm_name": "claude-3-haiku-20240307",
3270
+ "tags": "LLM,CHAT,200k",
3271
+ "max_tokens": 204800,
3272
+ "model_type": "chat"
3273
+ },
3274
+ {
3275
+ "llm_name": "claude-2.1",
3276
+ "tags": "LLM,CHAT,200k",
3277
+ "max_tokens": 204800,
3278
+ "model_type": "chat"
3279
+ },
3280
+ {
3281
+ "llm_name": "claude-2.0",
3282
+ "tags": "LLM,CHAT,100k",
3283
+ "max_tokens": 102400,
3284
+ "model_type": "chat"
3285
+ },
3286
+ {
3287
+ "llm_name": "claude-instant-1.2",
3288
+ "tags": "LLM,CHAT,100k",
3289
+ "max_tokens": 102400,
3290
+ "model_type": "chat"
3291
+ }
3292
+ ]
3293
  }
3294
  ]
3295
  }
rag/llm/__init__.py CHANGED
@@ -104,7 +104,8 @@ ChatModel = {
104
  "Replicate": ReplicateChat,
105
  "Tencent Hunyuan": HunyuanChat,
106
  "XunFei Spark": SparkChat,
107
- "BaiduYiyan": BaiduYiyanChat
 
108
  }
109
 
110
 
 
104
  "Replicate": ReplicateChat,
105
  "Tencent Hunyuan": HunyuanChat,
106
  "XunFei Spark": SparkChat,
107
+ "BaiduYiyan": BaiduYiyanChat,
108
+ "Anthropic": AnthropicChat
109
  }
110
 
111
 
rag/llm/chat_model.py CHANGED
@@ -1132,7 +1132,7 @@ class SparkChat(Base):
1132
  class BaiduYiyanChat(Base):
1133
  def __init__(self, key, model_name, base_url=None):
1134
  import qianfan
1135
-
1136
  key = json.loads(key)
1137
  ak = key.get("yiyan_ak","")
1138
  sk = key.get("yiyan_sk","")
@@ -1149,7 +1149,7 @@ class BaiduYiyanChat(Base):
1149
  if "max_tokens" in gen_conf:
1150
  gen_conf["max_output_tokens"] = gen_conf["max_tokens"]
1151
  ans = ""
1152
-
1153
  try:
1154
  response = self.client.do(
1155
  model=self.model_name,
@@ -1159,7 +1159,7 @@ class BaiduYiyanChat(Base):
1159
  ).body
1160
  ans = response['result']
1161
  return ans, response["usage"]["total_tokens"]
1162
-
1163
  except Exception as e:
1164
  return ans + "\n**ERROR**: " + str(e), 0
1165
 
@@ -1173,7 +1173,7 @@ class BaiduYiyanChat(Base):
1173
  gen_conf["max_output_tokens"] = gen_conf["max_tokens"]
1174
  ans = ""
1175
  total_tokens = 0
1176
-
1177
  try:
1178
  response = self.client.do(
1179
  model=self.model_name,
@@ -1193,3 +1193,67 @@ class BaiduYiyanChat(Base):
1193
  return ans + "\n**ERROR**: " + str(e), 0
1194
 
1195
  yield total_tokens
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1132
  class BaiduYiyanChat(Base):
1133
  def __init__(self, key, model_name, base_url=None):
1134
  import qianfan
1135
+
1136
  key = json.loads(key)
1137
  ak = key.get("yiyan_ak","")
1138
  sk = key.get("yiyan_sk","")
 
1149
  if "max_tokens" in gen_conf:
1150
  gen_conf["max_output_tokens"] = gen_conf["max_tokens"]
1151
  ans = ""
1152
+
1153
  try:
1154
  response = self.client.do(
1155
  model=self.model_name,
 
1159
  ).body
1160
  ans = response['result']
1161
  return ans, response["usage"]["total_tokens"]
1162
+
1163
  except Exception as e:
1164
  return ans + "\n**ERROR**: " + str(e), 0
1165
 
 
1173
  gen_conf["max_output_tokens"] = gen_conf["max_tokens"]
1174
  ans = ""
1175
  total_tokens = 0
1176
+
1177
  try:
1178
  response = self.client.do(
1179
  model=self.model_name,
 
1193
  return ans + "\n**ERROR**: " + str(e), 0
1194
 
1195
  yield total_tokens
1196
+
1197
+
1198
+ class AnthropicChat(Base):
1199
+ def __init__(self, key, model_name, base_url=None):
1200
+ import anthropic
1201
+
1202
+ self.client = anthropic.Anthropic(api_key=key)
1203
+ self.model_name = model_name
1204
+ self.system = ""
1205
+
1206
+ def chat(self, system, history, gen_conf):
1207
+ if system:
1208
+ self.system = system
1209
+ if "max_tokens" not in gen_conf:
1210
+ gen_conf["max_tokens"] = 4096
1211
+
1212
+ try:
1213
+ response = self.client.messages.create(
1214
+ model=self.model_name,
1215
+ messages=history,
1216
+ system=self.system,
1217
+ stream=False,
1218
+ **gen_conf,
1219
+ ).json()
1220
+ ans = response["content"][0]["text"]
1221
+ if response["stop_reason"] == "max_tokens":
1222
+ ans += (
1223
+ "...\nFor the content length reason, it stopped, continue?"
1224
+ if is_english([ans])
1225
+ else "······\n由于长度的原因，回答被截断了，请继续吗？"
1226
+ )
1227
+ return (
1228
+ ans,
1229
+ response["usage"]["input_tokens"] + response["usage"]["output_tokens"],
1230
+ )
1231
+ except Exception as e:
1232
+ return ans + "\n**ERROR**: " + str(e), 0
1233
+
1234
+ def chat_streamly(self, system, history, gen_conf):
1235
+ if system:
1236
+ self.system = system
1237
+ if "max_tokens" not in gen_conf:
1238
+ gen_conf["max_tokens"] = 4096
1239
+
1240
+ ans = ""
1241
+ total_tokens = 0
1242
+ try:
1243
+ response = self.client.messages.create(
1244
+ model=self.model_name,
1245
+ messages=history,
1246
+ system=self.system,
1247
+ stream=True,
1248
+ **gen_conf,
1249
+ )
1250
+ for res in response.iter_lines():
1251
+ res = res.decode("utf-8")
1252
+ if "content_block_delta" in res and "data" in res:
1253
+ text = json.loads(res[6:])["delta"]["text"]
1254
+ ans += text
1255
+ total_tokens += num_tokens_from_string(text)
1256
+ except Exception as e:
1257
+ yield ans + "\n**ERROR**: " + str(e)
1258
+
1259
+ yield total_tokens
requirements.txt CHANGED
@@ -1,3 +1,4 @@
 
1
  arxiv==2.1.3
2
  Aspose.Slides==24.2.0
3
  BCEmbedding==0.1.3
 
1
+ anthropic===0.34.1
2
  arxiv==2.1.3
3
  Aspose.Slides==24.2.0
4
  BCEmbedding==0.1.3
requirements_arm.txt CHANGED
@@ -2,6 +2,7 @@ accelerate==0.27.2
2
  aiohttp==3.9.4
3
  aiosignal==1.3.1
4
  annotated-types==0.6.0
 
5
  anyio==4.3.0
6
  argon2-cffi==23.1.0
7
  argon2-cffi-bindings==21.2.0
 
2
  aiohttp==3.9.4
3
  aiosignal==1.3.1
4
  annotated-types==0.6.0
5
+ anthropic===0.34.1
6
  anyio==4.3.0
7
  argon2-cffi==23.1.0
8
  argon2-cffi-bindings==21.2.0
web/src/assets/svg/llm/anthropic.svg ADDED
web/src/pages/user-setting/setting-model/constant.ts CHANGED
@@ -37,6 +37,7 @@ export const IconMap = {
37
  BaiduYiyan: 'yiyan',
38
  'Fish Audio': 'fish-audio',
39
  'Tencent Cloud': 'tencent-cloud',
 
40
  };
41
 
42
  export const BedrockRegionList = [
 
37
  BaiduYiyan: 'yiyan',
38
  'Fish Audio': 'fish-audio',
39
  'Tencent Cloud': 'tencent-cloud',
40
+ Anthropic: 'anthropic',
41
  };
42
 
43
  export const BedrockRegionList = [