Spaces:

ARCQUB
/

BPMN-entity-extractor

Sleeping

App Files Files Community

ARCQUB committed 23 days ago

Commit

5397ce0

verified ·

1 Parent(s): 33ad5cc

Update app.py

Browse files

Files changed (1) hide show

app.py +35 -18

app.py CHANGED Viewed

@@ -2,10 +2,20 @@ import gradio as gr
 import importlib
 from PIL import Image
 import json
-import os
-# === Load the GPT-4o module only
-from models import gpt4o_pix2struct_ocr
 # === Format Raw JSON Output
 def format_result_json(output):
@@ -128,12 +138,15 @@ def format_pretty_view(output):
     return "\n".join(lines).strip()
-# === Inference Handler (GPT-4o only)
-def process_image(image_file):
     image = Image.open(image_file.name).convert("RGB")
-    result = gpt4o_pix2struct_ocr.run_model(image)
     parsed_json = result.get("json")
-    raw_text = result.get("raw")
     if parsed_json:
         json_output = format_result_json(parsed_json)
@@ -144,23 +157,27 @@ def process_image(image_file):
     return image, json_output, pretty_output
-# === Gradio Interface
 iface = gr.Interface(
-    fn=process_image,
-    inputs=[gr.File(file_types=["image"], label="Upload a BPMN Diagram Image")],
     outputs=[
-        gr.Image(label="📷 Input Image"),
-        gr.Textbox(label="🧠 Raw JSON Output", lines=20),
-        gr.Textbox(label="📋 Prettified View", lines=25)
     ],
-    title="🧩 BPMN Extractor using GPT-4o + OCR",
-    description="Upload a BPMN diagram image. Extracts structured JSON using GPT-4o and Pix2Struct OCR. Runs on CPU-only Space.",
-    allow_flagging="never"
 )
-# === Launch without GPU
 def main():
-    iface.launch(ssr=False)
 if __name__ == "__main__":
     main()

 import importlib
 from PIL import Image
 import json
+import spaces
+# === Model Mapping ===
+MODEL_MAP = {
+    #"Qwen": "models.qwen",
+    #"Pixtral": "models.pixtral",
+    #"Aya Vision": "models.aya_vision",
+    "GPT-4o": "models.gpt4o"
+}
+# === Load Model
+def load_model_runner(model_name):
+    module = importlib.import_module(MODEL_MAP[model_name])
+    return module.run_model
 # === Format Raw JSON Output
 def format_result_json(output):
     return "\n".join(lines).strip()
+# === Main Inference Handler
+def process_single_image(model_name, image_file):
+    runner = load_model_runner(model_name)
     image = Image.open(image_file.name).convert("RGB")
+    result = runner(image)
     parsed_json = result.get("json")
+    raw_text = result.get("raw", "")
     if parsed_json:
         json_output = format_result_json(parsed_json)
     return image, json_output, pretty_output
+# === Gradio UI
 iface = gr.Interface(
+    fn=process_single_image,
+    inputs=[
+        gr.Dropdown(choices=list(MODEL_MAP.keys()), label="Select Vision Model"),
+        gr.File(file_types=["image"], label="Upload a BPMN Image")
+    ],
     outputs=[
+        gr.Image(label="Input Image"),
+        gr.Textbox(label="Raw JSON Output (Technical)", lines=20),
+        gr.Textbox(label="Prettified View (User-Friendly)", lines=25)
     ],
+    title="🖼️ Vision Model Extractor - JSON + Pretty View",
+    description="Upload a BPMN image and select a vision model to extract structured output. GPT-4o uses an API key from your Hugging Face Space Secret.",
+    flagging_mode="never"
 )
+# === Enable GPU mode and launch
+#@spaces.GPU
 def main():
+    iface.launch()
 if __name__ == "__main__":
     main()