Magjot committed on
Commit
ab07bea
·
verified ·
1 Parent(s): 255899c

Upload handler.py

Browse files
Files changed (1) hide show
  1. handler.py +18 -0
handler.py ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from transformers import AutoModelForCausalLM, AutoTokenizer
2
+ import torch
3
+ import os
4
+
5
class EndpointHandler:
    """Generate text from a prompt with a causal language model.

    NOTE(review): the class name and the ``__call__`` signature suggest this
    is meant to be used as a Hugging Face Inference Endpoints custom handler;
    confirm against the deployment.
    """

    def __init__(self, path=""):
        """Load the tokenizer and model from *path* and prepare for inference.

        Args:
            path: Location handed to ``from_pretrained`` for both the
                tokenizer and the model.
        """
        use_cuda = torch.cuda.is_available()
        self.tokenizer = AutoTokenizer.from_pretrained(path)
        self.model = AutoModelForCausalLM.from_pretrained(
            path,
            torch_dtype=torch.float16 if use_cuda else torch.float32,
        )
        # float16 is only chosen when CUDA is present, so the weights must
        # actually be placed on the GPU; otherwise half-precision weights
        # would be executed on the CPU.
        self.model.to("cuda" if use_cuda else "cpu")
        self.model.eval()

    def __call__(self, inputs: dict) -> dict:
        """Generate a continuation for the prompt stored under ``"inputs"``.

        Args:
            inputs: Request payload; the prompt is read from its ``"inputs"``
                key.

        Returns:
            ``{"generated_text": <decoded text>}`` on success, where the text
            is the decoded first output sequence of ``generate``, or
            ``{"error": "No input provided."}`` when the prompt is missing
            or empty.
        """
        prompt = inputs.get("inputs", "")
        if not prompt:
            return {"error": "No input provided."}

        encoded = self.tokenizer(prompt, return_tensors="pt")

        # Tensors must live on the same device as the model weights.
        device = self.model.device
        input_ids = encoded["input_ids"].to(device)

        # Forward the attention mask when the tokenizer produced one, so
        # generate() does not have to guess it from the pad token.
        attention_mask = encoded.get("attention_mask")
        if attention_mask is not None:
            attention_mask = attention_mask.to(device)

        outputs = self.model.generate(
            input_ids=input_ids,
            attention_mask=attention_mask,
            max_new_tokens=100,
        )
        generated = self.tokenizer.decode(outputs[0], skip_special_tokens=True)
        return {"generated_text": generated}