zakerytclarke committed
Commit d6c6437 · verified · 1 Parent(s): 00915d5

Update app.py

Files changed (1)
  1. app.py +3 -6
app.py CHANGED
@@ -53,19 +53,17 @@ async def brave_search(query, count=1):
         print(f"Error: {response.status}, {await response.text()}")
         return []
 
-
 @traceable
 @log_time
-async def query_teapot(prompt, context, user_input):
+def query_teapot(prompt, context, user_input):
     input_text = prompt + "\n" + context + "\n" + user_input
-    print(input_text)
+
     start_time = time.time()
 
     inputs = tokenizer(input_text, return_tensors="pt")
     input_length = inputs["input_ids"].shape[1]
 
-    # output = await asyncio.to_thread(model.generate, **inputs, max_new_tokens=512)
-    output = model.generate(inputs, max_new_tokens=512)
+    output = model.generate(**inputs, max_new_tokens=512)
 
     output_text = tokenizer.decode(output[0], skip_special_tokens=True)
     total_length = output.shape[1]  # Includes both input and output tokens
@@ -78,7 +76,6 @@ async def query_teapot(prompt, context, user_input):
 
     return output_text
 
-
 @log_time
 async def handle_chat(user_input):
     search_start_time = time.time()
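
The substantive fix in this commit is the generate call: the tokenizer returns a BatchEncoding, and the old model.generate(inputs, max_new_tokens=512) passed that object as a single positional argument instead of unpacking it into input_ids/attention_mask keyword arguments. The commit also drops the unused async qualifier and the debug print. The sketch below shows the corrected pattern in isolation; it is a minimal, hedged reconstruction, not the Space's actual setup — the checkpoint name is a stand-in, app.py loads its own tokenizer/model, and the @traceable/@log_time decorators are omitted.

# Minimal sketch of the corrected call pattern (assumptions: stand-in
# checkpoint, no tracing/timing decorators from app.py).
import time
import asyncio

from transformers import AutoTokenizer, AutoModelForSeq2SeqLM

tokenizer = AutoTokenizer.from_pretrained("google/flan-t5-small")   # stand-in checkpoint
model = AutoModelForSeq2SeqLM.from_pretrained("google/flan-t5-small")

def query_teapot(prompt, context, user_input):
    input_text = prompt + "\n" + context + "\n" + user_input
    start_time = time.time()

    # tokenizer(...) returns a BatchEncoding; ** unpacks it so generate()
    # receives input_ids=... and attention_mask=... as keyword arguments.
    inputs = tokenizer(input_text, return_tensors="pt")
    output = model.generate(**inputs, max_new_tokens=512)

    output_text = tokenizer.decode(output[0], skip_special_tokens=True)
    print(f"generate() took {time.time() - start_time:.2f}s "
          f"({output.shape[1]} total tokens, prompt + completion)")
    return output_text

# If handle_chat ever needs to await this again without blocking the event
# loop, the pattern from the removed comment still applies (Python 3.9+):
async def query_teapot_async(prompt, context, user_input):
    return await asyncio.to_thread(query_teapot, prompt, context, user_input)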