Spaces:

Zoe911
/

OCR-C

Sleeping

App Files Community

Zoe911 committed on Apr 2

Commit

c2c00e6

verified ·

1 Parent(s): 4875ce9

Update app.py

Browse files

Files changed (1) hide show

app.py +21 -21

app.py CHANGED Viewed

@@ -4,33 +4,33 @@ from PIL import Image
 import numpy as np
 import re
-# 初始化OCR模型
 ocr = PaddleOCR(use_angle_cls=True, lang="en")
 def ocr_recognition(image):
     try:
-        # 确保使用PIL
         if isinstance(image, np.ndarray):
             image = Image.fromarray(image)
         if not isinstance(image, Image.Image):
             return "Invalid image format"
-        # 转换为numpy数组
         image_np = np.array(image)
-        # 执行OCR识别
         result = ocr.ocr(image_np, cls=True)
         if not result or len(result) == 0 or result[0] is None:
             return "No text recognized"
-        # 提取文本
         texts = [line[1][0] for line in result[0] if line]
         if not texts:
             return "No text recognized"
-        # 解析文本以提取结构化信息
         structured_info = parse_text_to_structure(texts)
         return structured_info
@@ -38,7 +38,7 @@ def ocr_recognition(image):
         return f"Error processing image: {str(e)}"
 def parse_text_to_structure(texts):
-    # 初始化结构化字段
     structured_data = {
         "Event": "",
         "Location": "",
@@ -48,11 +48,11 @@ def parse_text_to_structure(texts):
         "Date": ""
     }
-    # 合并所有文本
     full_text = " ".join(texts)
-    # 尝试使用正则表达式匹配各个字段
-    # 这些模式需要根据您的实际文档格式进行调整
     event_pattern = re.search(r"(?:Event|Title):\s*(.+?)(?=\s*(?:Location|Venue|Date|Start|End|Duration)|$)", full_text, re.I)
     if event_pattern:
         structured_data["Event"] = event_pattern.group(1).strip()
@@ -77,29 +77,29 @@ def parse_text_to_structure(texts):
     if duration_pattern:
         structured_data["Duration"] = duration_pattern.group(1).strip()
-    # 如果没有找到明确的持续时间，但有开始和结束时间，可以尝试计算
     if structured_data["Duration"] == "" and structured_data["Start Time"] and structured_data["End Time"]:
-        # 这里需要更复杂的时间计算逻辑，简单起见暂时略过
         pass
-    # 格式化输出
     output = "\n".join([f"{key}: {value}" for key, value in structured_data.items() if value])
-    # 如果没有提取到任何结构化信息，返回原始文本
     if not output:
-        return "未能提取结构化信息。原始文本:\n" + "\n".join(texts)
     return output
-# 创建Gradio界面
 interface = gr.Interface(
     fn=ocr_recognition,
-    inputs=gr.Image(type="pil"),  # 明确指定使用PIL
     outputs="text",
-    title="结构化OCR识别",
-    description="上传图片进行文本识别，并提取事件、地点、时间等结构化信息"
 )
-# 启动服务
 if __name__ == "__main__":
-    interface.launch()

 import numpy as np
 import re
+# Initialize OCR model
 ocr = PaddleOCR(use_angle_cls=True, lang="en")
 def ocr_recognition(image):
     try:
+        # Ensure using PIL
         if isinstance(image, np.ndarray):
             image = Image.fromarray(image)
         if not isinstance(image, Image.Image):
             return "Invalid image format"
+        # Convert to numpy array
         image_np = np.array(image)
+        # Perform OCR recognition
         result = ocr.ocr(image_np, cls=True)
         if not result or len(result) == 0 or result[0] is None:
             return "No text recognized"
+        # Extract text
         texts = [line[1][0] for line in result[0] if line]
         if not texts:
             return "No text recognized"
+        # Parse text to extract structured information
         structured_info = parse_text_to_structure(texts)
         return structured_info
         return f"Error processing image: {str(e)}"
 def parse_text_to_structure(texts):
+    # Initialize structured fields
     structured_data = {
         "Event": "",
         "Location": "",
         "Date": ""
     }
+    # Merge all text
     full_text = " ".join(texts)
+    # Try to match each field using regex
+    # These patterns should be adjusted according to your actual document format
     event_pattern = re.search(r"(?:Event|Title):\s*(.+?)(?=\s*(?:Location|Venue|Date|Start|End|Duration)|$)", full_text, re.I)
     if event_pattern:
         structured_data["Event"] = event_pattern.group(1).strip()
     if duration_pattern:
         structured_data["Duration"] = duration_pattern.group(1).strip()
+    # If no explicit duration is found but we have start and end times, we could calculate it
     if structured_data["Duration"] == "" and structured_data["Start Time"] and structured_data["End Time"]:
+        # More complex time calculation logic would be needed here
         pass
+    # Format output
     output = "\n".join([f"{key}: {value}" for key, value in structured_data.items() if value])
+    # If no structured information was extracted, return the original text
     if not output:
+        return "\n".join(texts)
     return output
+# Create Gradio interface
 interface = gr.Interface(
     fn=ocr_recognition,
+    inputs=gr.Image(type="pil"),  # Explicitly specify using PIL
     outputs="text",
+    title="Structured OCR Recognition",
+    description="Upload an image for text recognition and extraction of structured information"
 )
+# Launch the service
 if __name__ == "__main__":
+    interface.launch()