Spaces:

retopara
/

ragflow

Build error

App Files Files Community

黄腾

aopstudio Kevin Hu committed on Aug 29, 2024

Commit

b6bfae8

1 Parent(s): 4636d13

add support for Voyage AI (#2159)

Browse files

### What problem does this PR solve?

#1853 #2138 add support for Voyage AI

### Type of change
- [x] New Feature (non-breaking change which adds functionality)

---------

Co-authored-by: Zhedong Cen <[email protected]>
Co-authored-by: Kevin Hu <[email protected]>

Files changed (9) hide show

conf/llm_factories.json +63 -1
rag/llm/__init__.py +5 -3
rag/llm/embedding_model.py +21 -0
rag/llm/rerank_model.py +16 -0
requirements.txt +1 -0
requirements_arm.txt +1 -0
web/src/assets/svg/llm/{lepton.svg → lepton-ai.svg} +0 -0
web/src/assets/svg/llm/voyage.svg +32 -0
web/src/pages/user-setting/setting-model/constant.ts +2 -1

conf/llm_factories.json CHANGED Viewed

@@ -2400,7 +2400,7 @@
             ]
         },
         {
-            "name": "Lepton",
             "logo": "",
             "tags": "LLM",
             "status": "1",
@@ -3290,6 +3290,68 @@
                     "model_type": "chat"
                 }
             ]
         }
     ]
 }

             ]
         },
         {
+            "name": "LeptonAI",
             "logo": "",
             "tags": "LLM",
             "status": "1",
                     "model_type": "chat"
                 }
             ]
+        },
+        {
+            "name": "Voyage AI",
+            "logo": "",
+            "tags": "TEXT EMBEDDING, TEXT RE-RANK",
+            "status": "1",
+            "llm": [
+                {
+                    "llm_name": "voyage-large-2-instruct",
+                    "tags": "TEXT EMBEDDING,16000",
+                    "max_tokens": 16000,
+                    "model_type": "embedding"
+                },
+                {
+                    "llm_name": "voyage-finance-2",
+                    "tags": "TEXT EMBEDDING,32000",
+                    "max_tokens": 32000,
+                    "model_type": "embedding"
+                },
+                {
+                    "llm_name": "voyage-multilingual-2",
+                    "tags": "TEXT EMBEDDING,32000",
+                    "max_tokens": 32000,
+                    "model_type": "embedding"
+                },
+                {
+                    "llm_name": "voyage-law-2",
+                    "tags": "TEXT EMBEDDING,16000",
+                    "max_tokens": 16000,
+                    "model_type": "embedding"
+                },
+                {
+                    "llm_name": "voyage-code-2",
+                    "tags": "TEXT EMBEDDING,16000",
+                    "max_tokens": 16000,
+                    "model_type": "embedding"
+                },
+                {
+                    "llm_name": "voyage-large-2",
+                    "tags": "TEXT EMBEDDING,16000",
+                    "max_tokens": 16000,
+                    "model_type": "embedding"
+                },
+                {
+                    "llm_name": "voyage-2",
+                    "tags": "TEXT EMBEDDING,4000",
+                    "max_tokens": 4000,
+                    "model_type": "embedding"
+                },
+                {
+                    "llm_name": "rerank-1",
+                    "tags": "RE-RANK, 8000",
+                    "max_tokens": 8000,
+                    "model_type": "rerank"
+                },
+                {
+                    "llm_name": "rerank-lite-1",
+                    "tags": "RE-RANK, 4000",
+                    "max_tokens": 4000,
+                    "model_type": "rerank"
+                }
+            ]
         }
     ]
 }

rag/llm/__init__.py CHANGED Viewed

@@ -45,7 +45,8 @@ EmbeddingModel = {
     "Upstage": UpstageEmbed,
     "SILICONFLOW": SILICONFLOWEmbed,
     "Replicate": ReplicateEmbed,
-    "BaiduYiyan": BaiduYiyanEmbed
 }
@@ -105,7 +106,7 @@ ChatModel = {
     "Tencent Hunyuan": HunyuanChat,
     "XunFei Spark": SparkChat,
     "BaiduYiyan": BaiduYiyanChat,
-    "Anthropic": AnthropicChat
 }
@@ -120,7 +121,8 @@ RerankModel = {
     "cohere": CoHereRerank,
     "TogetherAI": TogetherAIRerank,
     "SILICONFLOW": SILICONFLOWRerank,
-    "BaiduYiyan": BaiduYiyanRerank
 }

     "Upstage": UpstageEmbed,
     "SILICONFLOW": SILICONFLOWEmbed,
     "Replicate": ReplicateEmbed,
+    "BaiduYiyan": BaiduYiyanEmbed,
+    "Voyage AI": VoyageEmbed
 }
     "Tencent Hunyuan": HunyuanChat,
     "XunFei Spark": SparkChat,
     "BaiduYiyan": BaiduYiyanChat,
+    "Anthropic": AnthropicChat,
 }
     "cohere": CoHereRerank,
     "TogetherAI": TogetherAIRerank,
     "SILICONFLOW": SILICONFLOWRerank,
+    "BaiduYiyan": BaiduYiyanRerank,
+    "Voyage AI": VoyageRerank
 }

rag/llm/embedding_model.py CHANGED Viewed

@@ -623,3 +623,24 @@ class BaiduYiyanEmbed(Base):
             np.array([r["embedding"] for r in res["data"]]),
             res["usage"]["total_tokens"],
         )

             np.array([r["embedding"] for r in res["data"]]),
             res["usage"]["total_tokens"],
         )
+class VoyageEmbed(Base):
+    """Text-embedding model backed by the Voyage AI Python client."""
+
+    def __init__(self, key, model_name, base_url=None):
+        """Create the Voyage AI client.
+
+        Args:
+            key: API key passed to ``voyageai.Client``.
+            model_name: Model identifier sent with every embed request.
+            base_url: Accepted for signature parity; not used by this class.
+        """
+        # Imported here, so ``voyageai`` is only loaded when this class is
+        # instantiated.
+        import voyageai
+        self.client = voyageai.Client(api_key=key)
+        self.model_name = model_name
+
+    def encode(self, texts: list, batch_size=32):
+        """Embed ``texts`` as documents, ``batch_size`` texts per request.
+
+        Args:
+            texts: Texts to embed.
+            batch_size: Maximum number of texts sent in one request.
+
+        Returns:
+            ``(embeddings, total_tokens)``: an array built from the
+            embeddings of every request in input order, and the token
+            count summed over all requests. Empty ``texts`` produces an
+            empty array and ``0`` without calling the API.
+        """
+        # Guard against a zero/negative/None step, which would break range().
+        step = max(int(batch_size or 1), 1)
+        vectors = []
+        token_count = 0
+        for start in range(0, len(texts), step):
+            res = self.client.embed(
+                texts=texts[start:start + step],
+                model=self.model_name,
+                input_type="document",
+            )
+            vectors.extend(res.embeddings)
+            token_count += res.total_tokens
+        return np.array(vectors), token_count
+
+    def encode_queries(self, text):
+        """Embed ``text`` with ``input_type="query"``.
+
+        Returns:
+            ``(embeddings, total_tokens)`` taken from the client response.
+        """
+        res = self.client.embed(
+            texts=text, model=self.model_name, input_type="query"
+        )
+        return np.array(res.embeddings), res.total_tokens

rag/llm/rerank_model.py CHANGED Viewed

@@ -311,3 +311,19 @@ class BaiduYiyanRerank(Base):
         rank = np.array([d["relevance_score"] for d in res["results"]])
         indexs = [d["index"] for d in res["results"]]
         return rank[indexs], res["usage"]["total_tokens"]

         rank = np.array([d["relevance_score"] for d in res["results"]])
         indexs = [d["index"] for d in res["results"]]
         return rank[indexs], res["usage"]["total_tokens"]
+class VoyageRerank(Base):
+    """Re-rank model backed by the Voyage AI Python client."""
+
+    def __init__(self, key, model_name, base_url=None):
+        """Create the Voyage AI client.
+
+        Args:
+            key: API key passed to ``voyageai.Client``.
+            model_name: Model identifier sent with every rerank request.
+            base_url: Accepted for signature parity; not used by this class.
+        """
+        # Imported here, so ``voyageai`` is only loaded when this class is
+        # instantiated.
+        import voyageai
+        self.client = voyageai.Client(api_key=key)
+        self.model_name = model_name
+
+    def similarity(self, query: str, texts: list):
+        """Score every entry of ``texts`` against ``query``.
+
+        Args:
+            query: Query string.
+            texts: Candidate documents.
+
+        Returns:
+            ``(scores, total_tokens)`` where ``scores[i]`` is the relevance
+            score of ``texts[i]``. Empty ``texts`` yields an empty array and
+            ``0`` without calling the API.
+        """
+        rank = np.zeros(len(texts), dtype=float)
+        if not texts:
+            return rank, 0
+        res = self.client.rerank(
+            query=query, documents=texts, model=self.model_name, top_k=len(texts)
+        )
+        # Each result carries the position of its document in ``texts``;
+        # scatter the score to that slot. Indexing the score array by the
+        # list of indices instead would apply the permutation forward and
+        # attach scores to the wrong documents.
+        for r in res.results:
+            rank[r.index] = r.relevance_score
+        return rank, res.total_tokens

requirements.txt CHANGED Viewed

@@ -86,6 +86,7 @@ torch==2.3.0
 transformers==4.38.1
 umap==0.1.1
 volcengine==1.0.146
 webdriver_manager==4.0.1
 Werkzeug==3.0.3
 wikipedia==1.4.0

 transformers==4.38.1
 umap==0.1.1
 volcengine==1.0.146
+voyageai==0.2.3
 webdriver_manager==4.0.1
 Werkzeug==3.0.3
 wikipedia==1.4.0

requirements_arm.txt CHANGED Viewed

@@ -141,6 +141,7 @@ loguru==0.7.2
 umap-learn
 fasttext==0.9.2
 volcengine==1.0.141
 opencv-python-headless==4.9.0.80
 readability-lxml==0.8.1
 html_text==0.6.2

 umap-learn
 fasttext==0.9.2
 volcengine==1.0.141
+voyageai==0.2.3
 opencv-python-headless==4.9.0.80
 readability-lxml==0.8.1
 html_text==0.6.2

web/src/assets/svg/llm/{lepton.svg → lepton-ai.svg} RENAMED Viewed

File without changes

web/src/assets/svg/llm/voyage.svg ADDED Viewed

web/src/pages/user-setting/setting-model/constant.ts CHANGED Viewed

@@ -24,7 +24,7 @@ export const IconMap = {
   'LM-Studio': 'lm-studio',
   'OpenAI-API-Compatible': 'openai-api',
   cohere: 'cohere',
-  Lepton: 'lepton',
   TogetherAI: 'together-ai',
   PerfXCloud: 'perfx-cloud',
   Upstage: 'upstage',
@@ -38,6 +38,7 @@ export const IconMap = {
   'Fish Audio': 'fish-audio',
   'Tencent Cloud': 'tencent-cloud',
   Anthropic: 'anthropic',
 };
 export const BedrockRegionList = [

   'LM-Studio': 'lm-studio',
   'OpenAI-API-Compatible': 'openai-api',
   cohere: 'cohere',
+  LeptonAI: 'lepton-ai',
   TogetherAI: 'together-ai',
   PerfXCloud: 'perfx-cloud',
   Upstage: 'upstage',
   'Fish Audio': 'fish-audio',
   'Tencent Cloud': 'tencent-cloud',
   Anthropic: 'anthropic',
+  'Voyage AI': 'voyage',
 };
 export const BedrockRegionList = [