Spaces:

akhaliq
/

Hunyuan-MT-7B

Running on Zero

akhaliq HF Staff committed on 1 day ago

Commit

a233e6e

verified ·

1 Parent(s): 7e76458

Upload app.py with huggingface_hub

Files changed (1) hide show

app.py CHANGED Viewed

@@ -10,10 +10,11 @@ print("Loading model... This may take a few minutes.")
 tokenizer = AutoTokenizer.from_pretrained(model_name_or_path)
 model = AutoModelForCausalLM.from_pretrained(
     model_name_or_path,
-    torch_dtype=torch.bfloat16 if torch.cuda.is_available() else torch.float32,
     device_map="auto"
 )
 def respond(message, history, system_message=None, max_tokens=None, temperature=None, top_p=None):
     """
     Generate response from Hunyuan-MT model

 tokenizer = AutoTokenizer.from_pretrained(model_name_or_path)
 model = AutoModelForCausalLM.from_pretrained(
     model_name_or_path,
+    torch_dtype=torch.bfloat16,
     device_map="auto"
 )
+@spaces.GPU(duration=120)
 def respond(message, history, system_message=None, max_tokens=None, temperature=None, top_p=None):
     """
     Generate response from Hunyuan-MT model