Gradio2-QnA

Runtime error

App Files Files Community

ssirikon committed on Sep 15, 2024

Commit

ee743ce

verified ·

1 Parent(s): 37d9be4

Update app.py

Browse files

Files changed (1) hide show

app.py +26 -15

app.py CHANGED Viewed

@@ -7,7 +7,7 @@ from transformers import AutoModelForCausalLM, AutoTokenizer
 # Replace with your model name
 #MODEL_NAME = "ssirikon/Gemma7b-bnb-Unsloth"
 #MODEL_NAME = "unsloth/gemma-7b-bnb-4bit"
-MODEL_NAME = "Lohith9459/gemma7b"
 # Load the model and tokenizer
 max_seq_length = 512
@@ -20,14 +20,17 @@ load_in_4bit = True
 model = AutoModelForCausalLM.from_pretrained(MODEL_NAME, torch_dtype=torch.bfloat16, device_map="auto")
 tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
-def generate_subject(email_body):
-  instruction = "Generate a subject line for the following email."
   formatted_text = f"""Below is an instruction that describes a task. \
     Write a response that appropriately completes the request.
     ### Instruction:
     {instruction}
     ### Input:
-    {email_body}
     ### Response:
     """
   inputs = tokenizer([formatted_text], return_tensors="pt").to("cuda")
@@ -35,21 +38,29 @@ def generate_subject(email_body):
   generated_ids = model.generate(**inputs, streamer=text_streamer, max_new_tokens=512)
   generated_text = tokenizer.decode(generated_ids[0], skip_special_tokens=True)
-  def extract_subject(text):
-    start_tag = "### Response:"
-    start_idx = text.find(start_tag)
-    if start_idx == -1:
-        return None
-    subject = text[start_idx + len(start_tag):].strip()
-    return subject
-  return extract_subject(generated_text)
 # Create the Gradio interface
 demo = gr.Interface(
-    fn=generate_subject,
-    inputs=gr.Textbox(lines=20, label="Email Body"),
-    outputs=gr.Textbox(label="Generated Subject")
 )
 demo.launch()

 # Replace with your model name
 #MODEL_NAME = "ssirikon/Gemma7b-bnb-Unsloth"
 #MODEL_NAME = "unsloth/gemma-7b-bnb-4bit"
+MODEL_NAME = "Lohith9459/QnAD2_gemma7b"
 # Load the model and tokenizer
 max_seq_length = 512
 model = AutoModelForCausalLM.from_pretrained(MODEL_NAME, torch_dtype=torch.bfloat16, device_map="auto")
 tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
+def generate_answer(question):
+  instruction = "Generate an answer for the following question in less than two sentences."
   formatted_text = f"""Below is an instruction that describes a task. \
     Write a response that appropriately completes the request.
     ### Instruction:
     {instruction}
     ### Input:
+    {question}
     ### Response:
     """
   inputs = tokenizer([formatted_text], return_tensors="pt").to("cuda")
   generated_ids = model.generate(**inputs, streamer=text_streamer, max_new_tokens=512)
   generated_text = tokenizer.decode(generated_ids[0], skip_special_tokens=True)
+  def get_answer(text):
+      start_tag = "### Response:"
+      # Find the index of the response tag
+      start_idx = text.find(start_tag)
+      # Check that the response tag was found
+      if start_idx == -1:
+          return None  # Tags not found
+      # Extract everything after the response tag
+      answer = text[start_idx + len(start_tag):].strip()
+      return answer
+  return get_answer(generated_text)
 # Create the Gradio interface
 demo = gr.Interface(
+    fn=generate_answer,
+    inputs=gr.Textbox(lines=5, label="Ask Question on AI/ML"),
+    outputs=gr.Textbox(label="G-15 Gemma7b Model Generated Answer")
 )
 demo.launch()