Upload inference.py
Browse files- inference.py +11 -0
inference.py
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# inference.py
|
| 2 |
+
|
| 3 |
+
from text_embeddings_runner import EmbeddingRunner
|
| 4 |
+
|
| 5 |
+
def create_runner():
    """Build the embedding runner used for inference.

    The backend and device are pinned explicitly so the runner is forced
    onto PyTorch and the GPU.

    Returns:
        The object produced by ``EmbeddingRunner.from_pretrained`` for the
        ``magnifi/optimized-semcache-embeds-en-final`` repository.
    """
    # Collect the fixed loading options in one place before the call.
    runner_options = {
        "repo_id": "magnifi/optimized-semcache-embeds-en-final",
        "backend": "pytorch",
        "device": "cuda",
    }
    return EmbeddingRunner.from_pretrained(**runner_options)
|