Spaces:

imperiusrex
/

Handwritten_OCR

Sleeping

App Files Community

imperiusrex committed on Jul 31

Commit

1ae4d91

verified ·

1 Parent(s): 0400c24

Update app.py

Browse files

Files changed (1) hide show

app.py +44 -2

app.py CHANGED Viewed

@@ -30,7 +30,6 @@ print(f"Using device: {device}")
 # Initialize the PaddleOCR detection model
 print("Initializing PaddleOCR text detection model...")
 try:
-    # Use the PaddleOCR class with a specific model for detection only
     det_model = PaddleOCR(use_angle_cls=False, lang='en', use_gpu=torch.cuda.is_available(), show_log=False)
 except Exception as e:
     print(f"Error initializing PaddleOCR: {e}")
@@ -204,4 +203,47 @@ def process_file_and_create_pdf(file):
             temp_img_path = os.path.join(temp_output_dir, "original_image.png")
             original_image.save(temp_img_path)
-            c.drawImage(temp_img_path, 50, height - 300, width=200, preserveAspectRatio=T

 # Initialize the PaddleOCR detection model
 print("Initializing PaddleOCR text detection model...")
 try:
     det_model = PaddleOCR(use_angle_cls=False, lang='en', use_gpu=torch.cuda.is_available(), show_log=False)
 except Exception as e:
     print(f"Error initializing PaddleOCR: {e}")
             temp_img_path = os.path.join(temp_output_dir, "original_image.png")
             original_image.save(temp_img_path)
+            # Corrected the typo: `T` changed to `True`
+            c.drawImage(temp_img_path, 50, height - 300, width=200, preserveAspectRatio=True)
+            os.remove(temp_img_path)
+            y = height - 350
+            c.setFont("Helvetica", 12)
+            for _, text in results:
+                c.drawString(50, y, text)
+                y -= 15
+                if y < 50:
+                    c.showPage()
+                    c.setFont("Helvetica", 12)
+                    y = height - 50
+            c.save()
+        return output_pdf_path, input_image_for_display
+    except Exception as e:
+        print(f"An error occurred: {e}")
+        if os.path.exists(temp_output_dir):
+            shutil.rmtree(temp_output_dir)
+        return None, None
+# Gradio Interface
+@GPU
+def process_file_for_gradio(file):
+    output_path, input_image = process_file_and_create_pdf(file)
+    if output_path is None:
+        return None, None
+    return output_path, input_image
+demo = gr.Interface(
+    fn=process_file_for_gradio,
+    inputs=gr.File(label="Upload an Image (PNG, JPG) or a PDF", file_types=['.png', '.jpg', '.jpeg', '.pdf']),
+    outputs=[
+        gr.File(label="Download OCR Results PDF", interactive=False, visible=True),
+        gr.Image(label="Uploaded Image Preview", interactive=False)
+    ],
+    title="OCR App with PaddleOCR and TrOCR",
+    description="Upload an image or a multi-page PDF to get an output PDF with the recognized text from each page. The output PDF will be downloaded automatically.",
+)
+if __name__ == "__main__":
+    demo.launch()