Kevin Hu committed
Commit 541b2f3 · 1 Parent(s): fea9976
Make fast embed and default embed mutually exclusive. (#4121)
### What problem does this PR solve?

### Type of change

- [x] Performance Improvement
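For context: the diff below makes `FastEmbed` a subclass of `DefaultEmbedding` and has it read and write the base class's cached model, so at most one embedding model stays resident instead of each class holding its own. A minimal sketch of that shared class-attribute cache pattern (a sketch only; `BaseEmbedding`, `FastVariant`, and `_load` are illustrative names, not taken from `rag/llm/embedding_model.py`):

```python
# Illustrative sketch of a class-level model cache shared through inheritance.
import threading


class BaseEmbedding:
    _model = None                      # single shared slot for the loaded model
    _model_name = ""
    _model_lock = threading.Lock()

    def __init__(self, model_name: str):
        with BaseEmbedding._model_lock:
            # Reload only when nothing is cached or a different model is requested.
            if BaseEmbedding._model is None or model_name != BaseEmbedding._model_name:
                BaseEmbedding._model = self._load(model_name)
                BaseEmbedding._model_name = model_name
        self._model = BaseEmbedding._model
        self._model_name = model_name

    @staticmethod
    def _load(model_name: str):
        return f"<loaded {model_name}>"  # stand-in for an expensive model load


class FastVariant(BaseEmbedding):
    # Declares no _model/_model_name/_model_lock of its own, so every read and
    # write goes to the BaseEmbedding attributes: the two classes can never
    # hold two models at once.
    pass


if __name__ == "__main__":
    BaseEmbedding("BAAI/bge-large-zh-v1.5")
    FastVariant("BAAI/bge-small-en-v1.5")
    # Both names resolve to the same class attribute: exactly one cached model.
    print(FastVariant._model is BaseEmbedding._model)  # True
```

Before this change, `FastEmbed` declared its own `_model`, `_model_name`, and `_model_lock`, so it and `DefaultEmbedding` could each keep a separate model loaded; after it, both names resolve to the same slot on `DefaultEmbedding`.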
- rag/llm/embedding_model.py +7 -10
rag/llm/embedding_model.py CHANGED
@@ -251,11 +251,8 @@ class OllamaEmbed(Base):
         return np.array(res["embedding"]), 128
 
 
-class FastEmbed(Base):
-    _model = None
-    _model_name = ""
-    _model_lock = threading.Lock()
-
+class FastEmbed(DefaultEmbedding):
+
     def __init__(
             self,
             key: str | None = None,
@@ -267,17 +264,17 @@ class FastEmbed(Base):
         if not settings.LIGHTEN and not FastEmbed._model:
             with FastEmbed._model_lock:
                 from fastembed import TextEmbedding
-                if not FastEmbed._model or model_name != FastEmbed._model_name:
+                if not DefaultEmbedding._model or model_name != DefaultEmbedding._model_name:
                     try:
-                        FastEmbed._model = TextEmbedding(model_name, cache_dir, threads, **kwargs)
-                        FastEmbed._model_name = model_name
+                        DefaultEmbedding._model = TextEmbedding(model_name, cache_dir, threads, **kwargs)
+                        DefaultEmbedding._model_name = model_name
                     except Exception:
                         cache_dir = snapshot_download(repo_id="BAAI/bge-small-en-v1.5",
                                                       local_dir=os.path.join(get_home_cache_dir(),
                                                                              re.sub(r"^[a-zA-Z0-9]+/", "", model_name)),
                                                       local_dir_use_symlinks=False)
-                        FastEmbed._model = TextEmbedding(model_name, cache_dir, threads, **kwargs)
-        self._model = FastEmbed._model
+                        DefaultEmbedding._model = TextEmbedding(model_name, cache_dir, threads, **kwargs)
+        self._model = DefaultEmbedding._model
         self._model_name = model_name
 
     def encode(self, texts: list):
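A hedged usage sketch of the resulting behavior (not part of this PR; it assumes a RAGFlow environment where `rag.llm.embedding_model` is importable, and the constructor arguments shown are illustrative):

```python
# Class names come from rag/llm/embedding_model.py; exact kwargs are illustrative.
from rag.llm.embedding_model import DefaultEmbedding, FastEmbed

emb = FastEmbed(model_name="BAAI/bge-small-en-v1.5")

# FastEmbed no longer declares its own _model class attribute, so the lookup
# falls through to the single slot on DefaultEmbedding: loading one embedder
# replaces rather than duplicates the other.
assert FastEmbed._model is DefaultEmbedding._model
```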