Spaces:

prithivMLmods
/

Florence-2-Image-Caption

Running

App Files Files Community

prithivMLmods committed 13 days ago

Commit

c8f14aa

verified ·

1 Parent(s): 1522738

Update app.py

Browse files

Files changed (1) hide show

app.py +28 -77

app.py CHANGED Viewed

@@ -1,73 +1,8 @@
-import os
 import subprocess
 import torch
 from PIL import Image
 from transformers import AutoProcessor, AutoModelForCausalLM
-import gradio as gr
-from gradio.themes import Soft
-from gradio.themes.utils import colors, fonts, sizes
-from typing import Iterable
-# --- Theme and CSS Definition ---
-colors.steel_blue = colors.Color(
-    name="steel_blue",
-    c50="#EBF3F8",
-    c100="#D3E5F0",
-    c200="#A8CCE1",
-    c300="#7DB3D2",
-    c400="#529AC3",
-    c500="#4682B4",  # SteelBlue base color
-    c600="#3E72A0",
-    c700="#36638C",
-    c800="#2E5378",
-    c900="#264364",
-    c950="#1E3450",
-)
-class SteelBlueTheme(Soft):
-    def __init__(
-        self,
-        *,
-        primary_hue: colors.Color | str = colors.gray,
-        secondary_hue: colors.Color | str = colors.steel_blue,
-        neutral_hue: colors.Color | str = colors.slate,
-        text_size: sizes.Size | str = sizes.text_lg,
-        font: fonts.Font | str | Iterable[fonts.Font | str] = (
-            fonts.GoogleFont("Outfit"), "Arial", "sans-serif",
-        ),
-        font_mono: fonts.Font | str | Iterable[fonts.Font | str] = (
-            fonts.GoogleFont("IBM Plex Mono"), "ui-monospace", "monospace",
-        ),
-    ):
-        super().__init__(
-            primary_hue=primary_hue,
-            secondary_hue=secondary_hue,
-            neutral_hue=neutral_hue,
-            text_size=text_size,
-            font=font,
-            font_mono=font_mono,
-        )
-        super().set(
-            body_background_fill="linear-gradient(135deg, *primary_100, *primary_200)",
-            body_background_fill_dark="linear-gradient(135deg, *primary_800, *primary_900)",
-            button_primary_background_fill="linear-gradient(90deg, *secondary_500, *secondary_600)",
-            button_primary_background_fill_hover="linear-gradient(90deg, *secondary_600, *secondary_700)",
-            button_primary_text_color="white",
-            slider_color="*secondary_500",
-            slider_color_dark="*secondary_600",
-            block_title_text_weight="600",
-            block_border_width="2px",
-            block_shadow="*shadow_drop_lg",
-            button_shadow="*shadow_drop_lg",
-            button_large_padding="12px",
-        )
-# Instantiate the theme
-steel_blue_theme = SteelBlueTheme()
-# --- Model and App Setup ---
 # Attempt to install flash-attn
 try:
@@ -100,6 +35,13 @@ except Exception as e:
 def describe_image(uploaded_image, model_choice):
     """
     Generates a detailed description of the input image using the selected model.
     """
     if uploaded_image is None:
         return "Please upload an image."
@@ -147,28 +89,37 @@ if device == "cpu":
 # Define examples
 examples = [
-    ["images/2.jpeg", "Florence-2-large"],
-    ["images/1.jpeg", "Florence-2-base"],
-    ["images/3.jpeg", "Florence-2-large"],
-    ["images/4.jpeg", "Florence-2-large"]
 ]
 # Create the Gradio interface with Blocks
-with gr.Blocks(theme=steel_blue_theme) as demo:
     gr.Markdown("# **Florence-2 Models Image Captions**")
     gr.Markdown(description)
     with gr.Row():
         # Left column: Input image and Generate button
-        with gr.Column(scale=2):
-            image_input = gr.Image(label="Upload Image", type="pil", height=350)
-            generate_btn = gr.Button("Generate Caption", variant="primary")
             gr.Examples(examples=examples, inputs=[image_input])
         # Right column: Model choice, output, and examples
-        with gr.Column(scale=3):
             model_choice = gr.Radio(["Florence-2-base", "Florence-2-large"], label="Model Choice", value="Florence-2-base")
-            output = gr.Textbox(label="Generated Caption", lines=10, show_copy_button=True)
     # Connect the button to the function
     generate_btn.click(fn=describe_image, inputs=[image_input, model_choice], outputs=output)

+import gradio as gr
 import subprocess
 import torch
 from PIL import Image
 from transformers import AutoProcessor, AutoModelForCausalLM
 # Attempt to install flash-attn
 try:
 def describe_image(uploaded_image, model_choice):
     """
     Generates a detailed description of the input image using the selected model.
+    Args:
+        uploaded_image (PIL.Image.Image): The image to describe.
+        model_choice (str): The model to use, either "Florence-2-base" or "Florence-2-large".
+    Returns:
+        str: A detailed textual description of the image or an error message.
     """
     if uploaded_image is None:
         return "Please upload an image."
 # Define examples
 examples = [
+    ["images/2.png", "Florence-2-large"],
+    ["images/1.png", "Florence-2-base"],
+    ["images/3.png", "Florence-2-large"],
+    ["images/4.png", "Florence-2-large"]
 ]
+css = """
+.submit-btn {
+    background-color: #4682B4 !important;
+    color: white !important;
+}
+.submit-btn:hover {
+    background-color: #87CEEB !important;
+}
+"""
 # Create the Gradio interface with Blocks
+with gr.Blocks(theme="bethecloud/storj_theme", css=css) as demo:
     gr.Markdown("# **Florence-2 Models Image Captions**")
     gr.Markdown(description)
     with gr.Row():
         # Left column: Input image, Generate button, and examples
+        with gr.Column():
+            image_input = gr.Image(label="Upload Image", type="pil")
+            generate_btn = gr.Button("Generate Caption", elem_classes="submit-btn")
             gr.Examples(examples=examples, inputs=[image_input])
         # Right column: Model choice and output
+        with gr.Column():
             model_choice = gr.Radio(["Florence-2-base", "Florence-2-large"], label="Model Choice", value="Florence-2-base")
+            with gr.Row():
+                output = gr.Textbox(label="Generated Caption", lines=4, show_copy_button=True)
     # Connect the button to the function
     generate_btn.click(fn=describe_image, inputs=[image_input, model_choice], outputs=output)