wai572 committed on
Commit
11cc1d4
·
1 Parent(s): 905660e

Revert "paddleocr"

Browse files

This reverts commit f6e9138688ef632268208c2a6b0fb4ae7c5924fc.

Files changed (3) hide show
  1. Dockerfile +1 -2
  2. main.py +19 -16
  3. requirements.txt +0 -0
Dockerfile CHANGED
@@ -1,11 +1,10 @@
1
  FROM python:3.12.1
2
 
3
  ENV HF_HOME /tmp
4
- ENV HOME /tmp
5
 
6
  WORKDIR /code
7
 
8
- RUN apt-get update && apt-get install -y libgl1-mesa-glx libboost-thread1.74.0 libxext6 fonts-freefont-ttf && rm -rf /var/lib/apt/lists/*
9
 
10
 
11
 
 
1
  FROM python:3.12.1
2
 
3
  ENV HF_HOME /tmp
 
4
 
5
  WORKDIR /code
6
 
7
+ RUN apt-get update && apt-get install -y libgl1-mesa-glx libboost-thread1.74.0 && rm -rf /var/lib/apt/lists/*
8
 
9
 
10
 
main.py CHANGED
@@ -6,11 +6,11 @@ from datetime import datetime
6
  from typing import List
7
 
8
  import cv2
 
9
  import numpy as np
10
  from fastapi import FastAPI, HTTPException, Request, UploadFile
11
  from fastapi.middleware.cors import CORSMiddleware
12
  from fastapi.responses import JSONResponse
13
- from paddleocr import PaddleOCR
14
  from PIL import Image
15
 
16
  import dds
@@ -62,18 +62,18 @@ def load_ocr_model():
62
  グローバル変数readerに格納する。
63
  """
64
  global reader
65
- # model_dir = "/tmp/easyocr_models"
66
- # network_dir = "/tmp/easyocr_models/network"
67
 
68
  # 使用する言語と、モデルの保存先ディレクトリを指定してReaderを初期化
69
- # reader = easyocr.Reader(
70
- # ["en"],
71
- # model_storage_directory=model_dir,
72
- # user_network_directory=network_dir,
73
- # )
74
-
75
- reader = PaddleOCR(use_angle_cls=True, lang="en", show_log=False)
76
- print("PaddleOCR model loaded successfully.")
77
 
78
 
79
  # @app.on_event("startup")
@@ -213,11 +213,14 @@ async def analyze_image(image_paths: list[UploadFile]):
213
  # img = Image.fromarray(
214
  # cv2.cvtColor(candidate["img"], cv2.COLOR_BGR2RGB)
215
  # )
 
 
 
216
 
217
- result = reader.ocr(candidate["img"], cls=True)
218
- # result = reader.readtext(
219
- # candidate["img"], text_threshold=0.4
220
- # )
221
  print(result)
222
  if len(result) > 0:
223
  ocr_results.append(result)
@@ -239,7 +242,7 @@ async def analyze_image(image_paths: list[UploadFile]):
239
  # reds = []
240
  for i, result in enumerate(ocr_results):
241
  # text = result[0]["generated_text"].upper().strip()
242
- text = result[0][1][0]
243
  print(text, is_text_valid(text))
244
 
245
  text = is_text_valid(text)
 
6
  from typing import List
7
 
8
  import cv2
9
+ import easyocr
10
  import numpy as np
11
  from fastapi import FastAPI, HTTPException, Request, UploadFile
12
  from fastapi.middleware.cors import CORSMiddleware
13
  from fastapi.responses import JSONResponse
 
14
  from PIL import Image
15
 
16
  import dds
 
62
  グローバル変数readerに格納する。
63
  """
64
  global reader
65
+ model_dir = "/tmp/easyocr_models"
66
+ network_dir = "/tmp/easyocr_models/network"
67
 
68
  # 使用する言語と、モデルの保存先ディレクトリを指定してReaderを初期化
69
+ reader = easyocr.Reader(
70
+ ["en"],
71
+ model_storage_directory=model_dir,
72
+ user_network_directory=network_dir,
73
+ )
74
+ print(
75
+ f"EasyOCR model loaded successfully. Models are stored in {model_dir}"
76
+ )
77
 
78
 
79
  # @app.on_event("startup")
 
213
  # img = Image.fromarray(
214
  # cv2.cvtColor(candidate["img"], cv2.COLOR_BGR2RGB)
215
  # )
216
+ custom_config = (
217
+ r"--psm 10 -c tessedit_char_whitelist=0123456789AKQJ"
218
+ )
219
 
220
+ # result = reader.readtext(candidate["img"])
221
+ result = reader.readtext(
222
+ candidate["img"], text_threshold=0.4
223
+ )
224
  print(result)
225
  if len(result) > 0:
226
  ocr_results.append(result)
 
242
  # reds = []
243
  for i, result in enumerate(ocr_results):
244
  # text = result[0]["generated_text"].upper().strip()
245
+ _, text, _ = result[0]
246
  print(text, is_text_valid(text))
247
 
248
  text = is_text_valid(text)
requirements.txt CHANGED
Binary files a/requirements.txt and b/requirements.txt differ