项目初始化

2025-09-28 13:37:21 +08:00
commit 7795de3550
21 changed files with 364 additions and 0 deletions
--- a/.idea/.gitignore
+++ b/.idea/.gitignore
@@ -0,0 +1,8 @@
+# Default ignored files
+/shelf/
+/workspace.xml
+# Editor-based HTTP Client requests
+/httpRequests/
+# Datasource local storage ignored files
+/dataSources/
+/dataSources.local.xml
--- a/.idea/easyocr-api.iml
+++ b/.idea/easyocr-api.iml
@@ -0,0 +1,8 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<module type="PYTHON_MODULE" version="4">
+  <component name="NewModuleRootManager">
+    <content url="file://$MODULE_DIR$" />
+    <orderEntry type="inheritedJdk" />
+    <orderEntry type="sourceFolder" forTests="false" />
+  </component>
+</module>
--- a/.idea/inspectionProfiles/Project_Default.xml
+++ b/.idea/inspectionProfiles/Project_Default.xml
@@ -0,0 +1,41 @@
+<component name="InspectionProjectProfileManager">
+  <profile version="1.0">
+    <option name="myName" value="Project Default" />
+    <inspection_tool class="DuplicatedCode" enabled="true" level="WEAK WARNING" enabled_by_default="true">
+      <Languages>
+        <language minSize="130" name="Python" />
+      </Languages>
+    </inspection_tool>
+    <inspection_tool class="Eslint" enabled="true" level="WARNING" enabled_by_default="true" />
+    <inspection_tool class="PyPackageRequirementsInspection" enabled="true" level="WARNING" enabled_by_default="true">
+      <option name="ignoredPackages">
+        <value>
+          <list size="8">
+            <item index="0" class="java.lang.String" itemvalue="protobuf" />
+            <item index="1" class="java.lang.String" itemvalue="mkl-random" />
+            <item index="2" class="java.lang.String" itemvalue="numpy" />
+            <item index="3" class="java.lang.String" itemvalue="starlette" />
+            <item index="4" class="java.lang.String" itemvalue="charset-normalizer" />
+            <item index="5" class="java.lang.String" itemvalue="h11" />
+            <item index="6" class="java.lang.String" itemvalue="obs" />
+            <item index="7" class="java.lang.String" itemvalue="torch" />
+          </list>
+        </value>
+      </option>
+    </inspection_tool>
+    <inspection_tool class="PyPep8Inspection" enabled="true" level="WEAK WARNING" enabled_by_default="true">
+      <option name="ignoredErrors">
+        <list>
+          <option value="W292" />
+        </list>
+      </option>
+    </inspection_tool>
+    <inspection_tool class="PyPep8NamingInspection" enabled="true" level="WEAK WARNING" enabled_by_default="true">
+      <option name="ignoredErrors">
+        <list>
+          <option value="N803" />
+        </list>
+      </option>
+    </inspection_tool>
+  </profile>
+</component>
--- a/.idea/inspectionProfiles/profiles_settings.xml
+++ b/.idea/inspectionProfiles/profiles_settings.xml
@@ -0,0 +1,6 @@
+<component name="InspectionProjectProfileManager">
+  <settings>
+    <option name="USE_PROJECT_PROFILE" value="false" />
+    <version value="1.0" />
+  </settings>
+</component>
--- a/.idea/misc.xml
+++ b/.idea/misc.xml
@@ -0,0 +1,4 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<project version="4">
+  <component name="ProjectRootManager" version="2" project-jdk-name="Python 3.10 (easyocr)" project-jdk-type="Python SDK" />
+</project>
--- a/.idea/modules.xml
+++ b/.idea/modules.xml
@@ -0,0 +1,8 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<project version="4">
+  <component name="ProjectModuleManager">
+    <modules>
+      <module fileurl="file://$PROJECT_DIR$/.idea/easyocr-api.iml" filepath="$PROJECT_DIR$/.idea/easyocr-api.iml" />
+    </modules>
+  </component>
+</project>
--- a/.idea/vcs.xml
+++ b/.idea/vcs.xml
@@ -0,0 +1,6 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<project version="4">
+  <component name="VcsDirectoryMappings">
+    <mapping directory="$PROJECT_DIR$" vcs="Git" />
+  </component>
+</project>
--- a/README.md
+++ b/README.md
@@ -0,0 +1 @@
+OCR demo，包含两个模型：一个是 easyocr，另一个是百度的 paddleocr
--- a/api/init.py
+++ b/api/init.py
--- a/api/easy_orc_api.py
+++ b/api/easy_orc_api.py
@@ -0,0 +1,61 @@
+import os
+import cv2
+import easyocr
+import numpy as np
+from core.response import SuccessResponse
+from fastapi import APIRouter, UploadFile, Form
+from schemas.orc_result import ResultInfo, ResultMain
+
+
+app = APIRouter()  # router exposing the EasyOCR endpoint
+
+BASE_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))  # parent of this file's directory
+model_dir = os.path.join(BASE_DIR, 'model')
+
+reader = easyocr.Reader(  # built once at import time and shared by every request
+    ['ch_sim', 'en'],
+    model_storage_directory=model_dir,
+    download_enabled=False,  # NOTE(review): weights must already be in model_dir — confirm the detection model is shipped too
+    gpu=True)
+
+
+def preprocess_img(image):  # grayscale -> binarize -> denoise; returns the single-channel result
+    # Convert to grayscale (the input is treated as BGR).
+    gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
+    # Binarize. NOTE(review): with THRESH_OTSU the threshold is picked automatically, so 150 is presumably ignored.
+    _, binary = cv2.threshold(gray, 150, 255, cv2.THRESH_BINARY + cv2.THRESH_OTSU)
+    # Remove noise with a median filter of aperture 3.
+    denoised = cv2.medianBlur(binary, 3)
+    return denoised
+
+
+@app.post("/upload")
+async def orc(files: list[UploadFile] = Form(...)):  # run EasyOCR on every uploaded image
+    result = []
+    for file in files:
+        main = ResultMain()
+        main.file_name = file.filename
+        # Read the raw bytes of the upload.
+        image_data = await file.read()
+
+        # View the bytes as a uint8 buffer that OpenCV can decode.
+        np_array = np.frombuffer(image_data, np.uint8)
+
+        # Empty or undecodable uploads give image = None and an empty result, not an OpenCV error.
+        image = cv2.imdecode(np_array, cv2.IMREAD_COLOR) if np_array.size else None
+        # preprocess_img already returns an ndarray, so it is passed to the reader directly.
+        datas = [] if image is None else reader.readtext(preprocess_img(image))
+        infos = []
+        for data in datas:
+            info = ResultInfo()
+            bounding_boxs = data[0]  # box corners; [0] and [2] are used as opposite corners
+            left_up = bounding_boxs[0]
+            right_down = bounding_boxs[2]
+            info.bounding_box_left_up = [int(left_up[0]), int(left_up[1])]
+            info.bounding_box_right_down = [int(right_down[0]), int(right_down[1])]
+            info.text = data[1]
+            info.confidence = round(float(data[2]), 4)  # plain float keeps the payload JSON-friendly
+            infos.append(info)
+        main.infos = infos
+        result.append(main.model_dump())
+    return SuccessResponse(data=result)
--- a/api/paddle_ocr_api.py
+++ b/api/paddle_ocr_api.py
@@ -0,0 +1,55 @@
+from core.response import SuccessResponse
+from fastapi import APIRouter, UploadFile, Form
+from schemas.orc_result import ResultInfo, ResultMain
+
+from paddleocr import PaddleOCR
+import numpy as np
+import cv2
+
+
+app = APIRouter()  # router exposing the PaddleOCR endpoint
+
+
+paddle_ocr = PaddleOCR(lang='ch')  # built once at import time and shared by every request
+
+
+def enhance_image(img):
+    """Enhance bright and dark regions to make digits clearer."""
+    lab = cv2.cvtColor(img, cv2.COLOR_BGR2LAB)  # BGR -> LAB so lightness becomes its own channel
+    l, a, b = cv2.split(lab)
+    clahe = cv2.createCLAHE(clipLimit=3.0, tileGridSize=(8,8))
+    cl = clahe.apply(l)  # CLAHE is applied to the first (L) channel only
+    enhanced = cv2.merge((cl, a, b))
+    return cv2.cvtColor(enhanced, cv2.COLOR_LAB2BGR)
+
+
+@app.post("/upload")
+async def orc(files: list[UploadFile] = Form(...)):  # run PaddleOCR on every uploaded image
+    result = []
+    for file in files:
+        main = ResultMain()
+        main.file_name = file.filename
+        # Read the raw bytes of the upload.
+        image_data = await file.read()
+        # Decode the bytes; empty or undecodable uploads give img = None.
+        np_array = np.frombuffer(image_data, np.uint8)
+        img = cv2.imdecode(np_array, cv2.IMREAD_COLOR) if np_array.size else None
+        # Enhance and recognise only when decoding succeeded.
+        datas = paddle_ocr.ocr(enhance_image(img), cls=False) if img is not None else None
+        # The per-image entry is None when no text was found, so guard it before iterating.
+        lines = datas[0] if datas else None
+        infos = []
+        if lines:
+            for data in lines:
+                info = ResultInfo()
+                bounding_boxs = data[0]  # box corners; [0] and [2] are used as opposite corners
+                left_up = bounding_boxs[0]
+                right_down = bounding_boxs[2]
+                info.bounding_box_left_up = [int(left_up[0]), int(left_up[1])]
+                info.bounding_box_right_down = [int(right_down[0]), int(right_down[1])]
+                info.text = data[1][0]
+                info.confidence = round(float(data[1][1]), 4)  # plain float keeps the payload JSON-friendly
+                infos.append(info)
+        main.infos = infos
+        result.append(main.model_dump())  # every file is reported, even with no text, like the EasyOCR endpoint
+    return SuccessResponse(data=result)
--- a/application.py
+++ b/application.py
@@ -0,0 +1,24 @@
+from fastapi import FastAPI
+from fastapi.middleware.cors import CORSMiddleware
+
+from api.easy_orc_api import app as easy_orc_api
+
+from api.paddle_ocr_api import app as paddle_ocr_api
+
+
+app = FastAPI()
+
+
+'''
+添加cros中间件，允许跨域请求
+'''
+app.add_middleware(  # CORS middleware so pages served from other origins can call the API
+    CORSMiddleware,
+    allow_origins=["*"],
+    allow_credentials=True,  # NOTE(review): combined with a wildcard origin — confirm this is intended
+    allow_methods=["*"],
+    allow_headers=["*"],
+)
+
+
+app.include_router(paddle_ocr_api, prefix="/ocr", tags=["ocr识别"])  # NOTE(review): easy_orc_api is imported but never registered; only the PaddleOCR route is served
--- a/core/response.py
+++ b/core/response.py
@@ -0,0 +1,32 @@
+# 依赖安装：pip install orjson
+from fastapi.responses import ORJSONResponse as Response
+from fastapi import status as http_status
+from core import status as http
+
+
+class SuccessResponse(Response):
+    """
+    Success response: wraps ``data`` in a JSON envelope with ``code``, ``message`` and ``data`` keys.
+    """
+    def __init__(self, data=None, msg="success", code=http.HTTP_SUCCESS, status=http_status.HTTP_200_OK, **kwargs):
+        self.data = {
+            "code": code,
+            "message": msg,
+            "data": data
+        }
+        self.data.update(kwargs)  # extra keyword arguments become additional top-level keys
+        super().__init__(content=self.data, status_code=status)
+
+
+class ErrorResponse(Response):
+    """
+    Failure response: same envelope with an empty ``data`` list; the HTTP status still defaults to 200.
+    """
+    def __init__(self, msg=None, code=http.HTTP_ERROR, status=http_status.HTTP_200_OK, **kwargs):
+        self.data = {
+            "code": code,
+            "message": msg,
+            "data": []
+        }
+        self.data.update(kwargs)  # extra keyword arguments become additional top-level keys
+        super().__init__(content=self.data, status_code=status)
--- a/core/status.py
+++ b/core/status.py
@@ -0,0 +1,14 @@
+#!/usr/bin/python
+# -*- coding: utf-8 -*-
+# @version        : 1.0
+# @Create Time    : 2022/8/10 22:20 
+# @File           : status.py
+# @IDE            : PyCharm
+# @desc           : 简要说明
+
+
+HTTP_SUCCESS = 200  # default ``code`` value of SuccessResponse
+HTTP_ERROR = 400  # default ``code`` value of ErrorResponse
+HTTP_401_UNAUTHORIZED = 401
+HTTP_403_FORBIDDEN = 403
+HTTP_404_NOT_FOUND = 404
--- a/main.py
+++ b/main.py
@@ -0,0 +1,5 @@
+import uvicorn
+from application import app
+
+if __name__ == '__main__':
+    uvicorn.run("main:app", port=9800, reload=False, host='0.0.0.0')  # "main:app" resolves because app is imported into this module
--- a/model/zh_sim_g2.pth
+++ b/model/zh_sim_g2.pth
--- a/requirement.txt
+++ b/requirement.txt
@@ -0,0 +1,6 @@
+fastapi==0.112.2
+uvicorn==0.32.1
+easyocr==1.7.2
+orjson==3.10.16
+python-multipart==0.0.20
+paddleocr==2.10.0
--- a/schemas/orc_result.py
+++ b/schemas/orc_result.py
@@ -0,0 +1,18 @@
+from pydantic import BaseModel, ConfigDict, field_validator
+
+
+class ResultInfo(BaseModel):  # one recognised text region
+    bounding_box_left_up: list[int] | None = []  # two ints taken from the first box corner
+    bounding_box_right_down: list[int] | None = []  # two ints taken from the opposite box corner
+    text: str | None = None  # recognised text
+    confidence: float | None = None  # recognition score; the API handlers round it to 4 decimals
+
+    model_config = ConfigDict(from_attributes=True)
+
+
+class ResultMain(BaseModel):  # OCR result for one uploaded file
+    file_name: str | None = None  # filename as sent by the client
+    infos: list[ResultInfo] | None = []  # one entry per recognised text region
+
+    model_config = ConfigDict(from_attributes=True)
+
--- a/utils/opencv_util.py
+++ b/utils/opencv_util.py
@@ -0,0 +1,17 @@
+# Contrast enhancement + grayscale conversion + adaptive thresholding
+import cv2
+
+img = cv2.imread("fb1df265-5085-4bc2-881b-7674b620c4ac.jpg")  # NOTE(review): runs at import time; expects this file in the working directory
+
+# Convert to grayscale
+gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
+
+# Boost contrast with CLAHE
+clahe = cv2.createCLAHE(clipLimit=3.0, tileGridSize=(8, 8))
+enhanced = clahe.apply(gray)
+
+# Binarize with an inverted Gaussian adaptive threshold
+binary = cv2.adaptiveThreshold(enhanced, 255, cv2.ADAPTIVE_THRESH_GAUSSIAN_C,
+                               cv2.THRESH_BINARY_INV, 11, 2)
+
+cv2.imwrite("processed.png", binary)
--- a/utils/os_utils.py
+++ b/utils/os_utils.py
@@ -0,0 +1,39 @@
+import os
+from fastapi import UploadFile
+
+
+def file_path(*path):
+    """
+    Join the given components into a single file path.
+    :param path: path components, in order
+    :return: the joined path
+    """
+    # Delegate to os.path.join so the separator follows the host OS.
+    return os.path.join(*path)
+
+
+def create_folder(*path):
+    """Create the folder at the joined path (parents included) and return that path."""
+    folder_path = os.path.join(*path)
+    try:
+        os.makedirs(folder_path, exist_ok=True)  # an already existing folder is not an error
+    except Exception as e:
+        print(f"创建文件夹时错误： {e}")  # best effort: the failure is printed and the path is still returned
+    return folder_path
+
+
+def save_images(*path, file: UploadFile):
+    """
+    Save an uploaded image under the directory formed by ``path``.
+    :param path: directory components, joined with os.path.join
+    :param file: uploaded file; only the base name of ``file.filename`` is used
+    :return: the path the file was written to
+    """
+    # The client controls the filename: drop directory parts so it cannot escape ``path``.
+    save_path = os.path.join(*path, os.path.basename(file.filename))
+    os.makedirs(os.path.dirname(save_path), exist_ok=True)
+    with open(save_path, "wb") as f:
+        for line in file.file:
+            f.write(line)
+    return save_path
+
--- a/utils/pillow_util.py
+++ b/utils/pillow_util.py
@@ -0,0 +1,11 @@
+from PIL import Image, ImageEnhance
+
+# Load the image
+img = Image.open("fb1df265-5085-4bc2-881b-7674b620c4ac.jpg")
+
+# Boost contrast (factor 4.0 here; adjust as needed)
+enhancer = ImageEnhance.Contrast(img)
+img_enhanced = enhancer.enhance(4.0)
+
+# Save the enhanced image
+img_enhanced.save("enhanced_image_pillow.png")
				`@@ -0,0 +1 @@`
				`ocr demo,里面有两个模型一个是easyocr，一个是百度的paddleocr`