Spaces:

yeswanthvarma
/

answer-evaluation-app

Running

App Files Files Community

yeswanthvarma committed on Jun 26

Commit

1a1c667

verified ·

1 Parent(s): 23fad62

Update utils/image_processor.py

Browse files

Files changed (1) hide show

utils/image_processor.py +38 -35

utils/image_processor.py CHANGED Viewed

@@ -1,58 +1,61 @@
-import torch
 import cv2
-from transformers import TrOCRProcessor, VisionEncoderDecoderModel
 from PIL import Image
-import os
-# Load processor and model only once
 try:
     processor = TrOCRProcessor.from_pretrained("microsoft/trocr-base-handwritten")
     model = VisionEncoderDecoderModel.from_pretrained("microsoft/trocr-base-handwritten")
-    model.to("cpu")  # You can set to "cuda" if running with GPU
-    print("✅ TrOCR model loaded successfully.")
-    ocr_available = True
 except Exception as e:
-    print(f"❌ TrOCR initialization failed: {str(e)}")
-    ocr_available = False
 def extract_text_from_image(image_path):
     """
-    Extract text from an image file using EasyOCR or TrOCR (if integrated).
     """
     try:
         print(f"📂 Reading image from: {image_path}")
-        if not ocr_available:
-            raise ValueError("EasyOCR is not available")
         image = cv2.imread(image_path)
         if image is None:
-            raise ValueError(f"Could not read image at {image_path}")
-        processed_image = preprocess_image(image)
-        temp_path = os.path.join(os.path.dirname(image_path), f"temp_{os.path.basename(image_path)}")
-        cv2.imwrite(temp_path, processed_image)
-        results = reader.readtext(temp_path)
-        try:
-            os.remove(temp_path)
-        except:
-            pass
-        text = ' '.join([result[1] for result in results]).strip()
-        if not text:
-            results = reader.readtext(image_path)
-            text = ' '.join([result[1] for result in results]).strip()
-        # ✅ Log extracted text
-        print(f"📝 Extracted text from {os.path.basename(image_path)}:\n{text}\n")
-        return text or "Text extraction failed. Please enter text manually."
     except Exception as e:
-        print(f"OCR failed: {str(e)}")
         return "Text extraction failed. Please enter text manually."

+import os
 import cv2
+import numpy as np
 from PIL import Image
+import torch
+from transformers import TrOCRProcessor, VisionEncoderDecoderModel
+# ✅ Load TrOCR model and processor once
 try:
     processor = TrOCRProcessor.from_pretrained("microsoft/trocr-base-handwritten")
     model = VisionEncoderDecoderModel.from_pretrained("microsoft/trocr-base-handwritten")
+    model.eval()
+    print("✅ TrOCR model loaded.")
+    trocr_available = True
 except Exception as e:
+    print(f"❌ Failed to load TrOCR: {e}")
+    trocr_available = False
+def preprocess_image(image):
+    """
+    Preprocess image for OCR: convert to grayscale, denoise, and binarize with adaptive thresholding.
+    """
+    gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
+    denoised = cv2.fastNlMeansDenoising(gray, h=10)
+    processed = cv2.adaptiveThreshold(
+        denoised, 255, cv2.ADAPTIVE_THRESH_GAUSSIAN_C,
+        cv2.THRESH_BINARY, 11, 2
+    )
+    return processed
 def extract_text_from_image(image_path):
     """
+    Extract text using TrOCR from a handwritten image
     """
     try:
+        if not trocr_available:
+            raise ValueError("TrOCR is not available.")
         print(f"📂 Reading image from: {image_path}")
+        # Read and preprocess image
         image = cv2.imread(image_path)
         if image is None:
+            raise ValueError(f"Could not load image: {image_path}")
+        processed_image = preprocess_image(image)
+        pil_image = Image.fromarray(processed_image).convert("RGB")
+        # Convert the PIL image into the model-ready pixel_values tensor (the processor handles resizing and normalization)
+        pixel_values = processor(images=pil_image, return_tensors="pt").pixel_values
+        # Disable gradient for inference
+        with torch.no_grad():
+            generated_ids = model.generate(pixel_values)
+            generated_text = processor.batch_decode(generated_ids, skip_special_tokens=True)[0]
+        return generated_text.strip() or "Text extraction failed. Please enter text manually."
     except Exception as e:
+        print(f"OCR failed: {e}")
         return "Text extraction failed. Please enter text manually."