whisper-jax-yt-summary

Build error

App Files Files Community

ohmygod0193 committed on Nov 26, 2023

Commit

ba125ce

1 Parent(s): 8fe73ad

Update app.py

Browse files

Files changed (1) hide show

app.py +25 -28

app.py CHANGED Viewed

@@ -141,19 +141,19 @@ def summarize_text(title,text,temperature,words,use_api=False,api_token=None,do_
         summary_source = 'The summary was generated using {} hosted locally.'.format(llm_model_id)
-    # Map
     map_template = """
-    You are an intelligent AI assistant that is tasked to review the content of a video and provide a concise and accurate summary.\n
-    You do not provide information that is not mentioned in the video. You only provide information that you are absolutely sure about.\n
-    Reply with the language same as the title.\n
-    Summarize the following text in a clear and concise way:\n
     ----------------------- \n
     TITLE: `{title}`\n
     TEXT:\n
-    `{docs}`\n
     ----------------------- \n
-    BRIEF SUMMARY:\n
     """
     map_prompt = PromptTemplate(
         template = map_template,
         input_variables = ['title','docs']
@@ -162,19 +162,17 @@ def summarize_text(title,text,temperature,words,use_api=False,api_token=None,do_
     # Reduce - Collapse
     collapse_template = """
-    You are an intelligent AI assistant that is tasked to review the content of a video and provide a concise and accurate summary.\n
-    You do not provide information that is not mentioned in the video. You only provide information that you are absolutely sure about.\n
-    Reply with the language same as the title.\n
-    The following is set of partial summaries of a video:\n
     ----------------------- \n
     TITLE: `{title}`\n
     PARTIAL SUMMARIES:\n
     `{doc_summaries}`\n
     ----------------------- \n
-    Take these and distill them into a consolidated summary.\n
-    SUMMARY:\n
     """
     collapse_prompt = PromptTemplate(
         template = collapse_template,
         input_variables = ['title','doc_summaries']
@@ -187,18 +185,17 @@ def summarize_text(title,text,temperature,words,use_api=False,api_token=None,do_
         )
     # Final Reduce - Combine
-    combine_template = """\n
-    You are an intelligent AI assistant that is tasked to review the content of a video and provide a concise and accurate summary.\n
-    You do not provide information that is not mentioned in the video. You only provide information that you are absolutely sure about.\n
-    The following is a set of partial summaries of a video:\n
     ----------------------- \n
     TITLE: `{title}`\n
     PARTIAL SUMMARIES:\n
     `{doc_summaries}`\n
     ----------------------- \n
-    Generate an executive summary of the whole text in maximum {words} words that contains the main messages, points, and arguments presented in the video as bullet points. Avoid duplications or redundant information. \n
     EXECUTIVE SUMMARY:\n
     """
     combine_prompt = PromptTemplate(
         template = combine_template,
         input_variables = ['title','doc_summaries','words']
@@ -271,7 +268,7 @@ def summarize_youtube_video(url,force_transcribe,api_token="",
     if api_token == "":
         api_token = HF_TOKEN
     title,text,transcript_source = transcribe_youtube_video(url,force_transcribe,True,api_token)
-    print("Transcript:",text[:500])
     summary, summary_source = summarize_text(title,text,temperature,words,True,api_token,do_sample)
     print("Summary:",summary)
     return summary, text, transcript_source, summary_source
@@ -298,9 +295,7 @@ with gr.Blocks() as demo:
     with gr.Row():
         with gr.Column(scale=4):
             url = gr.Textbox(label="Enter YouTube video URL here:",placeholder="https://www.youtube.com/watch?v=",info="The video must not be age-restricted. Otherwise, the transcription will fail. The demo supports videos in English language only.")
-        with gr.Column(scale=1):
-            api_token = gr.Textbox(label="Paste your Hugging Face API token here (Optional):",placeholder="hf_...",visible=True,show_label=True,info='The API token passed via this field is not stored. It is only passed through the Hugging Face Hub API for inference.')
-        with gr.Column(scale=1):
             sum_btn = gr.Button("Summarize!")
             gr.Markdown("## Please like the repo if you find this helpful.")
@@ -330,14 +325,16 @@ with gr.Blocks() as demo:
         with gr.Group():
             transcript = gr.Textbox(label="Full Transcript",placeholder="transcript...",show_label=True)
             transcript_source = gr.Textbox(visible=False)
-    with gr.Accordion("# Acknoledgement",open=True):
         gr.Markdown("""
-                    ## Thank you for open source code from [smakamali](https://huggingface.co/smakamali) and [Sanchit Gandhi](https://huggingface.co/sanchit-gandhi)\n
-                    1. Most part of the code is duplicate from https://huggingface.co/spaces/smakamali/summarize_youtube. And thank you for smakamali's code\n
-                    Detailed instructions for recreating this tool are provided [here](https://pub.towardsai.net/a-complete-guide-for-creating-an-ai-assistant-for-summarizing-youtube-videos-part-1-32fbadabc2cc?sk=34269402931178039c4c3589df4a6ec5) and [here](https://pub.towardsai.net/a-complete-guide-for-creating-an-ai-assistant-for-summarizing-youtube-videos-part-2-a008ee18f341?sk=d59046b36a52c74dfa8befa99183e5b6)."
-                    2. I also call the api from https://sanchit-gandhi-whisper-jax.hf.space/\n
                     """)
-    with gr.Accordion("# Disclaimer",open=False):
         gr.Markdown("""
                     1. This app attempts to download the transcript from Youtube first. If the transcript is not available, or the prompts require, the video will be transcribed.\n
                     2. The app performs best on videos in which the number of speakers is limited or when the YouTube transcript includes annotations of the speakers.\n

         summary_source = 'The summary was generated using {} hosted locally.'.format(llm_model_id)
+    # Map templates
     map_template = """
+    As an AI tasked with summarizing a video, your objective is to distill the key insights without introducing new information. This prompt aims to provide a concise summary.\n
     ----------------------- \n
     TITLE: `{title}`\n
     TEXT:\n
+    `{docs}`\n
     ----------------------- \n
+    Summarize the provided content, emphasizing main points, key arguments, and relevant details. Keep the summary clear and succinct.\n
+    SUMMARY:\n
     """
     map_prompt = PromptTemplate(
         template = map_template,
         input_variables = ['title','docs']
     # Reduce - Collapse
     collapse_template = """
+    As an AI tasked with combining partial summaries, your goal is to create a cohesive, comprehensive summary without duplications.\n
     ----------------------- \n
     TITLE: `{title}`\n
     PARTIAL SUMMARIES:\n
     `{doc_summaries}`\n
     ----------------------- \n
+    Synthesize the information from the partial summaries into a consolidated, coherent summary. Ensure that the final summary covers all essential points without repeating redundant information.\n
+    CONSOLIDATED SUMMARY:\n
     """
     collapse_prompt = PromptTemplate(
         template = collapse_template,
         input_variables = ['title','doc_summaries']
         )
     # Final Reduce - Combine
+    combine_template = """
+    As an AI tasked with summarizing a video, your goal is to distill the main insights without introducing new information. This prompt aims to generate a concise executive summary.\n
     ----------------------- \n
     TITLE: `{title}`\n
     PARTIAL SUMMARIES:\n
     `{doc_summaries}`\n
     ----------------------- \n
+    Extract the most critical information from the partial summaries provided. Craft an executive summary in {words} words, focusing on the main arguments, key takeaways, and supporting evidence presented in the video. Aim for clarity, brevity, and avoid repeating redundant points. Ensure the summary encapsulates the essence of the content.\n
     EXECUTIVE SUMMARY:\n
     """
     combine_prompt = PromptTemplate(
         template = combine_template,
         input_variables = ['title','doc_summaries','words']
     if api_token == "":
         api_token = HF_TOKEN
     title,text,transcript_source = transcribe_youtube_video(url,force_transcribe,True,api_token)
+    print("Transcript:",text)
     summary, summary_source = summarize_text(title,text,temperature,words,True,api_token,do_sample)
     print("Summary:",summary)
     return summary, text, transcript_source, summary_source
     with gr.Row():
         with gr.Column(scale=4):
             url = gr.Textbox(label="Enter YouTube video URL here:",placeholder="https://www.youtube.com/watch?v=",info="The video must not be age-restricted. Otherwise, the transcription will fail. The demo supports videos in English language only.")
+        with gr.Column(scale=2):
             sum_btn = gr.Button("Summarize!")
             gr.Markdown("## Please like the repo if you find this helpful.")
         with gr.Group():
             transcript = gr.Textbox(label="Full Transcript",placeholder="transcript...",show_label=True)
             transcript_source = gr.Textbox(visible=False)
+    with gr.Accordion("Acknoledgement",open=True):
         gr.Markdown("""
+                    I sincerely appreciate the open source tools shared by [smakamali](https://huggingface.co/smakamali) (summary_method) and [Sanchit Gandhi](https://huggingface.co/sanchit-gandhi) (Whisper-Jax API)
+                    which were instrumental in developing this project. Their publicly available innovations in AI model training and speech recognition directly enabled key capabilities. Please view their exceptional repositories on HuggingFace for additional details.\n
+                    [summarize_youtube](https://huggingface.co/spaces/smakamali/summarize_youtube)\n
+                    Detailed instructions for recreating this tool are provided [here](https://pub.towardsai.net/a-complete-guide-for-creating-an-ai-assistant-for-summarizing-youtube-videos-part-1-32fbadabc2cc?sk=34269402931178039c4c3589df4a6ec5) and [here](https://pub.towardsai.net/a-complete-guide-for-creating-an-ai-assistant-for-summarizing-youtube-videos-part-2-a008ee18f341?sk=d59046b36a52c74dfa8befa99183e5b6).\n
+                    [Whisper-Jax-api](https://sanchit-gandhi-whisper-jax.hf.space/)\n
                     """)
+    with gr.Accordion("Disclaimer",open=False):
         gr.Markdown("""
                     1. This app attempts to download the transcript from Youtube first. If the transcript is not available, or the prompts require, the video will be transcribed.\n
                     2. The app performs best on videos in which the number of speakers is limited or when the YouTube transcript includes annotations of the speakers.\n