keithbourne committed on
Commit
43035cf
·
verified ·
1 Parent(s): fbb9153

Upload inference.py

Browse files
Files changed (1) hide show
  1. inference.py +11 -0
inference.py ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # inference.py
2
+
3
+ from text_embeddings_runner import EmbeddingRunner
4
+
5
def create_runner():
    """Create the embedding runner used for inference.

    Loads ``magnifi/optimized-semcache-embeds-en-final`` through
    ``EmbeddingRunner.from_pretrained`` with the backend and device
    pinned rather than left to any default selection.

    Returns:
        The object returned by ``EmbeddingRunner.from_pretrained``.
    """
    # Backend and device are fixed on purpose: PyTorch runner on GPU.
    load_options = {
        "repo_id": "magnifi/optimized-semcache-embeds-en-final",
        "backend": "pytorch",
        "device": "cuda",
    }
    runner = EmbeddingRunner.from_pretrained(**load_options)
    return runner