Spaces:
Sleeping
Sleeping
Revert "paddleocr"
Browse files
This reverts commit f6e9138688ef632268208c2a6b0fb4ae7c5924fc.
- Dockerfile +1 -2
- main.py +19 -16
- requirements.txt +0 -0
Dockerfile
CHANGED
@@ -1,11 +1,10 @@
|
|
1 |
FROM python:3.12.1
|
2 |
|
3 |
ENV HF_HOME /tmp
|
4 |
-
ENV HOME /tmp
|
5 |
|
6 |
WORKDIR /code
|
7 |
|
8 |
-
RUN apt-get update && apt-get install -y libgl1-mesa-glx libboost-thread1.74.0
|
9 |
|
10 |
|
11 |
|
|
|
1 |
FROM python:3.12.1
|
2 |
|
3 |
ENV HF_HOME /tmp
|
|
|
4 |
|
5 |
WORKDIR /code
|
6 |
|
7 |
+
RUN apt-get update && apt-get install -y libgl1-mesa-glx libboost-thread1.74.0 && rm -rf /var/lib/apt/lists/*
|
8 |
|
9 |
|
10 |
|
main.py
CHANGED
@@ -6,11 +6,11 @@ from datetime import datetime
|
|
6 |
from typing import List
|
7 |
|
8 |
import cv2
|
|
|
9 |
import numpy as np
|
10 |
from fastapi import FastAPI, HTTPException, Request, UploadFile
|
11 |
from fastapi.middleware.cors import CORSMiddleware
|
12 |
from fastapi.responses import JSONResponse
|
13 |
-
from paddleocr import PaddleOCR
|
14 |
from PIL import Image
|
15 |
|
16 |
import dds
|
@@ -62,18 +62,18 @@ def load_ocr_model():
|
|
62 |
グローバル変数readerに格納する。
|
63 |
"""
|
64 |
global reader
|
65 |
-
|
66 |
-
|
67 |
|
68 |
# 使用する言語と、モデルの保存先ディレクトリを指定してReaderを初期化
|
69 |
-
|
70 |
-
|
71 |
-
|
72 |
-
|
73 |
-
|
74 |
-
|
75 |
-
|
76 |
-
|
77 |
|
78 |
|
79 |
# @app.on_event("startup")
|
@@ -213,11 +213,14 @@ async def analyze_image(image_paths: list[UploadFile]):
|
|
213 |
# img = Image.fromarray(
|
214 |
# cv2.cvtColor(candidate["img"], cv2.COLOR_BGR2RGB)
|
215 |
# )
|
|
|
|
|
|
|
216 |
|
217 |
-
result = reader.
|
218 |
-
|
219 |
-
|
220 |
-
|
221 |
print(result)
|
222 |
if len(result) > 0:
|
223 |
ocr_results.append(result)
|
@@ -239,7 +242,7 @@ async def analyze_image(image_paths: list[UploadFile]):
|
|
239 |
# reds = []
|
240 |
for i, result in enumerate(ocr_results):
|
241 |
# text = result[0]["generated_text"].upper().strip()
|
242 |
-
text = result[0]
|
243 |
print(text, is_text_valid(text))
|
244 |
|
245 |
text = is_text_valid(text)
|
|
|
6 |
from typing import List
|
7 |
|
8 |
import cv2
|
9 |
+
import easyocr
|
10 |
import numpy as np
|
11 |
from fastapi import FastAPI, HTTPException, Request, UploadFile
|
12 |
from fastapi.middleware.cors import CORSMiddleware
|
13 |
from fastapi.responses import JSONResponse
|
|
|
14 |
from PIL import Image
|
15 |
|
16 |
import dds
|
|
|
62 |
グローバル変数readerに格納する。
|
63 |
"""
|
64 |
global reader
|
65 |
+
model_dir = "/tmp/easyocr_models"
|
66 |
+
network_dir = "/tmp/easyocr_models/network"
|
67 |
|
68 |
# 使用する言語と、モデルの保存先ディレクトリを指定してReaderを初期化
|
69 |
+
reader = easyocr.Reader(
|
70 |
+
["en"],
|
71 |
+
model_storage_directory=model_dir,
|
72 |
+
user_network_directory=network_dir,
|
73 |
+
)
|
74 |
+
print(
|
75 |
+
f"EasyOCR model loaded successfully. Models are stored in {model_dir}"
|
76 |
+
)
|
77 |
|
78 |
|
79 |
# @app.on_event("startup")
|
|
|
213 |
# img = Image.fromarray(
|
214 |
# cv2.cvtColor(candidate["img"], cv2.COLOR_BGR2RGB)
|
215 |
# )
|
216 |
+
custom_config = (
|
217 |
+
r"--psm 10 -c tessedit_char_whitelist=0123456789AKQJ"
|
218 |
+
)
|
219 |
|
220 |
+
# result = reader.readtext(candidate["img"])
|
221 |
+
result = reader.readtext(
|
222 |
+
candidate["img"], text_threshold=0.4
|
223 |
+
)
|
224 |
print(result)
|
225 |
if len(result) > 0:
|
226 |
ocr_results.append(result)
|
|
|
242 |
# reds = []
|
243 |
for i, result in enumerate(ocr_results):
|
244 |
# text = result[0]["generated_text"].upper().strip()
|
245 |
+
_, text, _ = result[0]
|
246 |
print(text, is_text_valid(text))
|
247 |
|
248 |
text = is_text_valid(text)
|
requirements.txt
CHANGED
Binary files a/requirements.txt and b/requirements.txt differ
|
|