Commit c0bc1870f6 by Tinger, 2 years ago
47 changed files with 8516 additions and 0 deletions
Changed files:

  1. .gitignore (+6 -0)
  2. Dockerfile (+15 -0)
  3. Readme.md (+39 -0)
  4. app.py (+35 -0)
  5. blues/__init__.py (+2 -0)
  6. blues/com.py (+41 -0)
  7. blues/idc.py (+156 -0)
  8. docker-compose.yml (+12 -0)
  9. gunicorn.conf.py (+3 -0)
  10. hmOCR/__init__.py (+3 -0)
  11. hmOCR/argument.py (+41 -0)
  12. hmOCR/core.py (+56 -0)
  13. hmOCR/enter.py (+47 -0)
  14. hmOCR/parts/__init__.py (+5 -0)
  15. hmOCR/parts/classifier.py (+80 -0)
  16. hmOCR/parts/detector.py (+111 -0)
  17. hmOCR/parts/operator.py (+450 -0)
  18. hmOCR/parts/recognizer.py (+81 -0)
  19. hmOCR/parts/utils.py (+160 -0)
  20. hmOCR/static/cls/inference.pdiparams (BIN)
  21. hmOCR/static/cls/inference.pdiparams.info (BIN)
  22. hmOCR/static/cls/inference.pdmodel (BIN)
  23. hmOCR/static/det/inference.pdiparams (BIN)
  24. hmOCR/static/det/inference.pdiparams.info (BIN)
  25. hmOCR/static/det/inference.pdmodel (BIN)
  26. hmOCR/static/key-set.txt (+6623 -0)
  27. hmOCR/static/rec/inference.pdiparams (BIN)
  28. hmOCR/static/rec/inference.pdiparams.info (BIN)
  29. hmOCR/static/rec/inference.pdmodel (BIN)
  30. hmOCR/static/test_image/01.jpg (BIN)
  31. hmOCR/static/test_image/02.jpg (BIN)
  32. hmOCR/static/test_image/03.jpg (BIN)
  33. hmOCR/static/test_image/04.jpg (BIN)
  34. hmOCR/utility.py (+109 -0)
  35. requires.cpu (+10 -0)
  36. static/html/common.svg (+9 -0)
  37. static/html/favicon.png (BIN)
  38. static/html/identity.svg (+11 -0)
  39. static/html/more.svg (+13 -0)
  40. templates/com_index.html (+27 -0)
  41. templates/com_result.html (+88 -0)
  42. templates/idc_index.html (+33 -0)
  43. templates/k-v_result.html (+85 -0)
  44. templates/navigate.html (+77 -0)
  45. utils/__init__.py (+1 -0)
  46. utils/conf.py (+7 -0)
  47. utils/util.py (+80 -0)

+ 6 - 0
.gitignore

@@ -0,0 +1,6 @@
+__pycache__
+venv
+.idea
+static/images/*
+
+test.py

+ 15 - 0
Dockerfile

@@ -0,0 +1,15 @@
+FROM python:3.9
+
+WORKDIR /srv
+
+COPY requires.cpu .
+
+ARG tuna=https://pypi.tuna.tsinghua.edu.cn/simple
+
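+# libgl1-mesa-glx provides libGL.so.1, which opencv-python needs at import time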
+RUN pip install --no-cache-dir --upgrade pip -i $tuna && \
+    pip install --no-cache-dir -r requires.cpu -i $tuna && \
+    sed -i "s@http://deb.debian.org@https://mirrors.tuna.tsinghua.edu.cn@g" /etc/apt/sources.list && \
+    apt-get update && apt-get install -y --no-install-recommends libgl1-mesa-glx && \
+    apt-get clean && rm -rf /var/lib/apt/lists/*
+
+CMD ["gunicorn", "app:app"]

+ 39 - 0
Readme.md

@@ -0,0 +1,39 @@
+## PaddleOCR API
+
+---
+
+**$host: https://img.ifarmcloud.com/ocr**
+
+**API documentation: [intranet](http://192.168.1.6:10393/shareDoc?issue=df3c14ae8582a40ee191762f8fda504b) /
+[public](https://console-docs.apipost.cn/preview/d46d3cce127f3856/39166dc588c72981)**
+
+**Parameters marked with * are required.**
+
+**Response body: {success: "bool: whether the request succeeded", message: "text: description", data: "json: payload"}**
+
+---
+
++ $host/
+  + Method: GET, or open directly in a browser
+  + Purpose: index page of the online demo
+  + See: [HuiMv OCR Index](http://139.9.167.178:5050/)
+
++ $host/com/
+  + General-purpose OCR endpoint
+  + Method: POST
+  + Parameters:
+    + *picture: image file to recognize
+    + type: operation type (raw: raw OCR output; filter: recognized-text list only [default]; html: render the result as an HTML page)
+  + Returns: JSON
+  + Endpoint docs: [intranet](http://192.168.1.6:10393/shareDoc?issue=4372c38974a592f95748939af1c40b52) /
+    [public](https://console-docs.apipost.cn/preview/4cc8e896b0556775/953929384b227f1d)
+
++ $host/idc/
+  + Mainland China resident ID card recognition endpoint
+  + Method: POST
+  + Parameters:
+    + *picture: image file to recognize
+    + *which: card side (face: portrait side; icon: national-emblem side)
+  + Returns: JSON
+  + Endpoint docs: [intranet](http://192.168.1.6:10393/shareDoc?issue=2f9f3334ea40558d20ba42057ffd45c2) /
+    [public](https://console-docs.apipost.cn/preview/7da01bde77cb4e05/90734f27243d2309)
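
A minimal client sketch for the endpoints documented above. The host and field names come from this Readme; the exact shape of `data` is an assumption based on the handlers in `blues/com.py` and `blues/idc.py`:

```python
import requests

HOST = "https://img.ifarmcloud.com/ocr"

# general OCR: "filter" (the default) returns only the recognized text list
with open("sample.jpg", "rb") as f:
    r = requests.post(f"{HOST}/com/", files={"picture": f}, data={"type": "filter"})
print(r.json())  # e.g. {"success": true, "message": "...", "data": ["line 1", "line 2"]}

# ID card, portrait side: data should carry name/gender/nation/birth/addr/idn on success
with open("idcard_face.jpg", "rb") as f:
    r = requests.post(f"{HOST}/idc/", files={"picture": f}, data={"which": "face"})
print(r.json())
```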

+ 35 - 0
app.py

@@ -0,0 +1,35 @@
+from utils import conf
+from blues import com, idc
+from flask_cors import CORS
+from flask import Flask, render_template, Response
+
+
+def init() -> "Flask":
+    this = Flask(__name__)
+    CORS(this)
+    this.config.from_object(conf)
+
+    this.register_blueprint(com)
+    this.register_blueprint(idc)
+
+    return this
+
+
+app = init()
+
+
+@app.route("/")
+def index():
+    return render_template("navigate.html")
+
+
+@app.route("/favicon.ico")
+def icon():
+    with open("static/html/favicon.png", "rb") as f:
+        img = f.read()
+    return Response(img, mimetype="image/png")
+
+
+if __name__ == "__main__":
+    app.run(host=conf.SERVER_HOST, port=conf.SERVER_PORT)

+ 2 - 0
blues/__init__.py

@@ -0,0 +1,2 @@
+from .com import com
+from .idc import idc

+ 41 - 0
blues/com.py

@@ -0,0 +1,41 @@
+from utils.util import *
+from utils.conf import MAX_CONTENT_LENGTH
+from flask import Blueprint, views, render_template, request
+
+com = Blueprint("com", __name__, url_prefix="/com")
+
+
+class ComView(views.MethodView):
+    @staticmethod
+    def get():
+        return render_template("com_index.html")
+
+    @staticmethod
+    def post():
+        pic = request.files.get("picture")
+        if pic is None:
+            return Response("empty body")
+        ext = get_ext_name(pic.filename)
+        if not is_image_ext(ext):
+            return Response("文件类型错误")
+        content = pic.read()
+        if len(content) > MAX_CONTENT_LENGTH:
+            return Response("文件过大,请重新选择")
+        file_path = f"static/images/{current_time()}_{rand_str()}.{ext}"
+        save_img(file_path, content)
+
+        img = read_img(content)
+        ocr_res = Engine.ocr_one(img, cls=True)
+        kind = request.form.get("type")
+        if kind is not None:
+            kind = kind.lower()
+        if kind == "raw":
+            return Response(data=ocr_res)
+        elif kind == "html":
+            data = [{"word": it[0], "rate": it[1], "index": i + 1} for i, it in enumerate(ocr_res)]
+            return render_template("com_result.html", raw=file_path, data=data)
+        else:
+            return Response(data=[it[0] for it in ocr_res])
+
+
+com.add_url_rule("/", view_func=ComView.as_view("com"))

+ 156 - 0
blues/idc.py

@@ -0,0 +1,156 @@
+import re
+from time import time
+from utils.util import *
+from utils.conf import MAX_CONTENT_LENGTH
+from flask import Blueprint, views, render_template, request
+
+idc = Blueprint("idc", __name__, url_prefix="/idc")
+
+__exclude = "中国CHINA *#★☆"
+__face_ptn = r"^姓名(?P<name>.+)性别(?P<gender>男|女)民族(?P<nation>.+)" \
+             r"出生(?P<year>\d{4})年(?P<month>\d\d)月(?P<day>\d\d)日" \
+             r"住址(?P<addr>.+)公民身份号码(?P<idn>\d{17}\d|x|X)$"
+__icon_ptn = r"^中华人民共和国居民身份证签发机关(?P<agent>.+)" \
+             r"有效期限(?P<from_year>\d{4})\.(?P<from_month>\d{2})\.(?P<from_day>\d{2})" \
+             r"[^\d]+(?P<to_year>\d{4})\.(?P<to_month>\d{2})\.(?P<to_day>\d{2})$"
+
+
+def get_face_info(data: "list[str]") -> "tuple[dict, str, bool]":
+    res = {"name": "", "gender": "", "nation": "", "birth": {"year": "", "month": "", "day": ""}, "addr": "", "idn": ""}
+    if len(data) < 5:  # need at least 5 recognized lines
+        return res, "请使用正确的身份证人像面照片", False
+
+    str_all = "".join([item for item in data if not str_include(__exclude, item)])
+    if match := re.match(__face_ptn, str_all):
+        res["name"] = match.group("name")
+        res["gender"] = match.group("gender")
+        res["nation"] = match.group("nation")
+        res["birth"] = {
+            "year": match.group("year"),
+            "month": match.group("month"),
+            "day": match.group("day")
+        }
+        res["addr"] = match.group("addr")
+        res["idn"] = match.group("idn")
+        return res, str_all, True
+
+    return res, "识别失败,请重新选择", False
+
+
+def get_icon_info(data: "list[str]") -> "tuple[dict, str, bool]":
+    res = {"agent": "", "from": {"year": "", "month": "", "day": ""}, "to": {"year": "", "month": "", "day": ""}}
+    if len(data) < 4:  # need at least 4 recognized lines
+        return res, "请使用正确的身份证国徽面照片", False
+
+    str_all = "".join([item for item in data if not str_include(__exclude, item)])
+    if match := re.match(__icon_ptn, str_all):
+        res["agent"] = match.group("agent")
+        res["from"] = {
+            "year": match.group("from_year"),
+            "month": match.group("from_month"),
+            "day": match.group("from_day"),
+        }
+        res["to"] = {
+            "year": match.group("to_year"),
+            "month": match.group("to_month"),
+            "day": match.group("to_day"),
+        }
+        return res, str_all, True
+    return res, "识别失败,请重新选择", False
+
+
+class IdcView(views.MethodView):
+    @staticmethod
+    def get():
+        return render_template("idc_index.html")
+
+    @staticmethod
+    def post():
+        start = time()
+        which = request.form.get("which")
+        if which is not None:
+            which = which.lower()
+        if which not in ["face", "icon"]:
+            return Response(f"not recognized arg <which>: '{which}'")
+        pic = request.files.get("picture")
+        if pic is None:
+            return Response("empty body")
+        ext = get_ext_name(pic.filename)
+        if not is_image_ext(ext):
+            return Response("文件类型错误")
+        content = pic.read()
+        if len(content) > MAX_CONTENT_LENGTH:
+            return Response("文件过大,请重新选择")
+
+        img = read_img(content)
+        images = rot_img(img)
+        rec = Engine.ocr_multi(images, cls=True, use_space=False)
+        info, msg, sta, idx = {}, "识别失败,请重新选择", False, 0
+        for idx, ocr_res in enumerate(rec):
+            words = [it[0].replace(" ", "") for it in ocr_res]
+            if which == "face":
+                if not words or not words[0].startswith("姓名"):
+                    continue
+                info, msg, sta = get_face_info(words)
+            else:
+                if not words or not words[0].startswith("中华"):
+                    continue
+                info, msg, sta = get_icon_info(words)
+            if sta:
+                break
+
+        info["duration"] = time() - start
+        if sta:
+            raw_path = f"static/images/{current_time()}_{rand_str()}.{ext}"
+            save_img(raw_path, images[idx])
+            return Response(data=info)
+        return Response(msg, info)
+
+
+class IdcHtmlView(views.MethodView):
+    @staticmethod
+    def post():
+        start = time()
+        which = request.form.get("which")
+        if which is not None:
+            which = which.lower()
+        if which not in ["face", "icon"]:
+            return Response(f"not recognized arg <which>: '{which}'")
+        pic = request.files.get("picture")
+        if pic is None:
+            return Response("empty body")
+        ext = get_ext_name(pic.filename)
+        if not is_image_ext(ext):
+            return Response("文件类型错误")
+        content = pic.read()
+        if len(content) > MAX_CONTENT_LENGTH:
+            return Response("文件过大,请重新选择")
+
+        img = read_img(content)
+        images = rot_img(img)
+        rec = Engine.ocr_multi(images, cls=True, use_space=False)
+        info, msg, sta, idx = {}, "识别失败,请重新选择", False, 0
+        for idx, ocr_res in enumerate(rec):
+            words = [it[0].replace(" ", "") for it in ocr_res]
+            if which == "face":
+                if not words or not words[0].startswith("姓名"):
+                    continue
+                info, msg, sta = get_face_info(words)
+            else:
+                if not words or not words[0].startswith("中华"):
+                    continue
+                info, msg, sta = get_icon_info(words)
+            if sta:
+                break
+
+        file_path = f"static/images/{current_time()}_{rand_str()}.{ext}"
+        save_img(file_path, images[idx])
+
+        info["SUCCESS"] = str(sta).upper()
+        info["MESSAGE"] = msg
+        info["DURATION"] = time() - start  # noqa
+        return render_template("k-v_result.html", raw=file_path, data=info)
+
+
+idc.add_url_rule("/", view_func=IdcView.as_view("idc"))
+idc.add_url_rule("/html/", view_func=IdcHtmlView.as_view("idc-html"))

+ 12 - 0
docker-compose.yml

@@ -0,0 +1,12 @@
+version: "3"
+
+services:
+  PaddleOCR:
+    build: .
+    ports:
+      - "5050:80"
+    image: ocr:latest
+    container_name: PaddleOCR
+    restart: unless-stopped
+    volumes:
+      - ./:/srv/

+ 3 - 0
gunicorn.conf.py

@@ -0,0 +1,3 @@
+bind = "0.0.0.0:80"
+worker_class = "gevent"
+workers = 2

+ 3 - 0
hmOCR/__init__.py

@@ -0,0 +1,3 @@
+from .core import HuiMvOcr
+from .argument import Args, ArgType
+from .utility import *

+ 41 - 0
hmOCR/argument.py

@@ -0,0 +1,41 @@
+__all__ = ["Args", "ArgType"]
+
+
+class Args:
+    def __init__(self, **kwargs):
+        self.__update(
+            use_gpu=False, precision="fp32", use_tensorrt=False,
+            # gpu
+            gpu_mem=500, max_batch_size=6, min_subgraph_size=15,
+            # cpu
+            enable_mkldnn=True, cpu_threads=16,
+            # detector
+            det_model_dir="hmOCR/static/det", det_algorithm="DB", det_limit_side_len=960,
+            det_limit_type="max", det_db_thresh=0.3, det_db_box_thresh=0.6, det_db_unclip_ratio=1.5,
+            det_use_dilation=False, det_db_score_mode="fast", det_box_type="quad",
+            # classifier
+            cls_model_dir="hmOCR/static/cls", cls_image_shape="3, 48, 192",
+            cls_batch_num=6, cls_thresh=0.9, cls_label_list=["0", "180"],
+            # recognizer
+            rec_model_dir="hmOCR/static/rec", rec_algorithm="SVTR_LCNet",
+            rec_image_shape="3, 48, 320", rec_batch_num=8, max_text_length=25,
+            rec_char_dict_path="hmOCR/static/key-set.txt", use_space_char=False,
+            # OCR
+            drop_score=0.5,
+            # test
+            image_dir="static/test_image", warmup=True
+        )
+        self.__update(**kwargs)
+
+    def __update(self, **kwargs):
+        for k, v in kwargs.items():
+            self.__dict__[k] = v
+
+    def __getattr__(self, key: "str"):
+        try:  # raise AttributeError (not KeyError) so getattr()/hasattr() behave correctly
+            return self.__dict__[key]
+        except KeyError:
+            raise AttributeError(key) from None
+
+    def __setattr__(self, key: "str", value):
+        self.__dict__[key] = value
+
+
+ArgType = Args
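
A small usage sketch of the `Args` container above; everything shown is a default wired in `__init__` unless overridden:

```python
from hmOCR.argument import Args

args = Args(cpu_threads=8, drop_score=0.6)  # keyword overrides replace the defaults
print(args.cpu_threads)     # 8    (overridden)
print(args.det_algorithm)   # "DB" (default kept)
args.rec_batch_num = 16     # attributes can also be assigned after construction
```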

+ 56 - 0
hmOCR/core.py

@@ -0,0 +1,56 @@
+from .parts import *
+from .utility import *
+from copy import deepcopy
+from .argument import ArgType
+from concurrent.futures import ThreadPoolExecutor
+
+__all__ = ["HuiMvOcr"]
+
+
+class HuiMvOcr:
+    __worker_count = 1
+
+    def __init__(self, args: "ArgType"):
+        self.det = Detector(args)
+        self.cls = Classifier(args)
+        self.rec = Recognizer(args)
+
+        self.det_box_type = args.det_box_type
+        self.drop_score = args.drop_score
+        self.crop_image_res_index = 0
+
+    def ocr_one(self, img, cls: "bool" = False, use_space: "bool" = True):
+        ori_im = img.copy()
+        dt_boxes = self.det(img)
+        if dt_boxes is None:
+            return None
+
+        dt_boxes = sorted_boxes(dt_boxes)
+        size = len(dt_boxes)
+        img_crop_list = [None] * size  # pre-allocated; filled in the loop below
+
+        for i in range(size):
+            box = deepcopy(dt_boxes[i])
+            if self.det_box_type == "quad":
+                img_crop_list[i] = get_rotate_crop_image(ori_im, box)
+            else:
+                img_crop_list[i] = get_min_area_rect_crop(ori_im, box)
+
+        if cls:
+            img_crop_list = self.cls(img_crop_list)
+
+        rec_res = self.rec(img_crop_list, use_space=use_space)
+
+        filter_rec_res = []
+        for text, score in rec_res:
+            if score > self.drop_score:
+                filter_rec_res.append((text, score))
+
+        return filter_rec_res
+
+    def ocr_multi(self, img_list, cls: "bool" = False, use_space: "bool" = True):
+        with ThreadPoolExecutor(HuiMvOcr.__worker_count) as pool:  # shut the pool down when done
+            tasks = [pool.submit(self.ocr_one, img, cls, use_space) for img in img_list]
+            return [task.result() for task in tasks]
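
A hedged usage sketch for the pipeline above, assuming it is run from the repository root so the relative model paths in `Args` resolve (`enter.py` below exercises the same calls in batch):

```python
import cv2
from hmOCR import HuiMvOcr, Args

engine = HuiMvOcr(Args())                           # loads det/cls/rec predictors
img = cv2.imread("hmOCR/static/test_image/01.jpg")  # one of the bundled test images
res = engine.ocr_one(img, cls=True)                 # [(text, confidence), ...]
print([text for text, score in res])
```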

+ 47 - 0
hmOCR/enter.py

@@ -0,0 +1,47 @@
+import cv2
+import numpy as np
+from utility import *
+from argument import *
+from core import HuiMvOcr
+from time import time
+
+
+def main(args: "ArgType"):
+    image_file_list = get_image_file_list(args.image_dir)
+    engine = HuiMvOcr(args)
+
+    # warm up 10 times
+    if args.warmup:
+        img = np.random.uniform(0, 255, [640, 640, 3]).astype(np.uint8)
+        for _ in range(10):
+            engine.ocr_one(img)
+    # single
+    print("single start")
+    total_time, res = 0, []
+    for image_file in image_file_list:
+        img, flag_gif = check_and_read(image_file)
+        if not flag_gif:
+            img = cv2.imread(image_file)  # noqa
+        st = time()
+        rec_res = engine.ocr_one(img, cls=True, use_space=False)
+        elapse = time() - st
+        total_time += elapse
+        res.append(rec_res)
+    print(f"single total time: {total_time}")
+    for i in range(len(res)):
+        print(f"file: {image_file_list[i]}")
+        print("res:", res[i])
+
+    # multi
+    images = [cv2.imread(file) for file in image_file_list]  # noqa
+    print("\n\nmulti start")
+    st = time()
+    res = engine.ocr_multi(images, cls=True, use_space=False)
+    print(f"multi total time {time() - st}")
+    for i in range(len(res)):
+        print(f"file: {image_file_list[i]}")
+        print("res:", res[i])
+
+
+if __name__ == "__main__":
+    main(Args())

+ 5 - 0
hmOCR/parts/__init__.py

@@ -0,0 +1,5 @@
+from .detector import Detector
+from .classifier import Classifier
+from .recognizer import Recognizer
+
+__all__ = ["Detector", "Classifier", "Recognizer"]

+ 80 - 0
hmOCR/parts/classifier.py

@@ -0,0 +1,80 @@
+import cv2
+import math
+import numpy as np
+from .utils import *
+from copy import deepcopy
+from hmOCR.argument import Args
+
+
+class Classifier:
+    def __init__(self, args: "Args"):
+        self.cls_image_shape = [int(v) for v in args.cls_image_shape.split(",")]
+        self.cls_batch_num = args.cls_batch_num
+        self.cls_thresh = args.cls_thresh
+        postprocess_params = {
+            "name": "ClsPostProcess",
+            "label_list": args.cls_label_list
+        }
+        self.postprocess_op = build_post_process(postprocess_params)
+        self.predictor, self.input_tensor, self.output_tensors = create_predictor(args, "cls")
+
+    def resize_norm_img(self, img):
+        imgC, imgH, imgW = self.cls_image_shape
+        h = img.shape[0]
+        w = img.shape[1]
+        ratio = w / float(h)
+        if math.ceil(imgH * ratio) > imgW:
+            resized_w = imgW
+        else:
+            resized_w = int(math.ceil(imgH * ratio))
+        resized_image = cv2.resize(img, (resized_w, imgH))  # noqa
+        resized_image = resized_image.astype("float32")
+        if self.cls_image_shape[0] == 1:
+            resized_image = resized_image / 255
+            resized_image = resized_image[np.newaxis, :]
+        else:
+            resized_image = resized_image.transpose((2, 0, 1)) / 255
+        resized_image -= 0.5
+        resized_image /= 0.5
+        padding_im = np.zeros((imgC, imgH, imgW), dtype=np.float32)
+        padding_im[:, :, 0:resized_w] = resized_image
+        return padding_im
+
+    def __call__(self, img_list):
+        img_list = deepcopy(img_list)
+        img_num = len(img_list)
+        # Calculate the aspect ratio of all text bars
+        width_list = []
+        for img in img_list:
+            width_list.append(img.shape[1] / float(img.shape[0]))
+        # Sorting can speed up the cls process
+        indices = np.argsort(np.array(width_list))
+
+        batch_num = self.cls_batch_num
+
+        for beg_img_no in range(0, img_num, batch_num):
+            end_img_no = min(img_num, beg_img_no + batch_num)
+            norm_img_batch = []
+            max_wh_ratio = 0
+            for ino in range(beg_img_no, end_img_no):
+                h, w = img_list[indices[ino]].shape[0:2]
+                wh_ratio = w * 1.0 / h
+                max_wh_ratio = max(max_wh_ratio, wh_ratio)
+            for ino in range(beg_img_no, end_img_no):
+                norm_img = self.resize_norm_img(img_list[indices[ino]])
+                norm_img = norm_img[np.newaxis, :]
+                norm_img_batch.append(norm_img)
+            norm_img_batch = np.concatenate(norm_img_batch)
+            norm_img_batch = norm_img_batch.copy()
+
+            self.input_tensor.copy_from_cpu(norm_img_batch)
+            self.predictor.run()
+            prob_out = self.output_tensors[0].copy_to_cpu()
+            self.predictor.try_shrink_memory()
+
+            cls_result = self.postprocess_op(prob_out)
+            for rno in range(len(cls_result)):
+                label, score = cls_result[rno]
+                if "180" in label and score > self.cls_thresh:
+                    img_list[indices[beg_img_no + rno]] = cv2.rotate(img_list[indices[beg_img_no + rno]], 1)  # noqa
+        return img_list

+ 111 - 0
hmOCR/parts/detector.py

@@ -0,0 +1,111 @@
+import numpy as np
+from .utils import *
+from hmOCR.argument import Args
+
+
+class Detector:
+    def __init__(self, args: "Args"):
+        self.det_algorithm = args.det_algorithm  # DB
+        self.det_box_type = args.det_box_type
+        pre_process_list = [{
+            "DetResizeForTest": {
+                "limit_side_len": args.det_limit_side_len,
+                "limit_type": args.det_limit_type,
+            }
+        }, {
+            "NormalizeImage": {
+                "std": [0.229, 0.224, 0.225],
+                "mean": [0.485, 0.456, 0.406],
+                "scale": 1 / 255,
+                "order": "hwc"
+            }
+        }, {
+            "ToCHWImage": None
+        }, {
+            "KeepKeys": {
+                "keep_keys": ["image", "shape"]
+            }
+        }]
+        postprocess_params = {
+            "name": "DBPostProcess", "thresh": args.det_db_thresh,
+            "box_thresh": args.det_db_box_thresh, "max_candidates": 1000,
+            "unclip_ratio": args.det_db_unclip_ratio, "use_dilation": args.det_use_dilation,
+            "score_mode": args.det_db_score_mode, "box_type": args.det_box_type
+        }
+
+        self.pre_operator = create_operators(pre_process_list)
+        self.post_operator = build_post_process(postprocess_params)
+        self.predictor, self.input_tensor, self.output_tensors = create_predictor(args, "det")
+
+    @staticmethod
+    def order_points_clockwise(pts):
+        rect = np.zeros((4, 2), dtype="float32")
+        s = pts.sum(axis=1)
+        rect[0] = pts[np.argmin(s)]
+        rect[2] = pts[np.argmax(s)]
+        tmp = np.delete(pts, (np.argmin(s), np.argmax(s)), axis=0)
+        diff = np.diff(np.array(tmp), axis=1)
+        rect[1] = tmp[np.argmin(diff)]
+        rect[3] = tmp[np.argmax(diff)]
+        return rect
+
+    @staticmethod
+    def clip_det_res(points, img_height, img_width):
+        for pno in range(points.shape[0]):
+            points[pno, 0] = int(min(max(points[pno, 0], 0), img_width - 1))
+            points[pno, 1] = int(min(max(points[pno, 1], 0), img_height - 1))
+        return points
+
+    def filter_tag_det_res(self, dt_boxes, image_shape):
+        img_height, img_width = image_shape[0:2]
+        dt_boxes_new = []
+        for box in dt_boxes:
+            if type(box) is list:
+                box = np.array(box)
+            box = self.order_points_clockwise(box)
+            box = self.clip_det_res(box, img_height, img_width)
+            rect_width = int(np.linalg.norm(box[0] - box[1]))
+            rect_height = int(np.linalg.norm(box[0] - box[3]))
+            if rect_width <= 3 or rect_height <= 3:
+                continue
+            dt_boxes_new.append(box)
+        dt_boxes = np.array(dt_boxes_new)
+        return dt_boxes
+
+    def filter_tag_det_res_only_clip(self, dt_boxes, image_shape):
+        img_height, img_width = image_shape[0:2]
+        dt_boxes_new = []
+        for box in dt_boxes:
+            if type(box) is list:
+                box = np.array(box)
+            box = self.clip_det_res(box, img_height, img_width)
+            dt_boxes_new.append(box)
+        dt_boxes = np.array(dt_boxes_new)
+        return dt_boxes
+
+    def __call__(self, img):
+        ori_im = img.copy()
+        data = {"image": img}
+
+        data = transform(data, self.pre_operator)
+        img, shape_list = data
+        if img is None:
+            return None
+        img = np.expand_dims(img, axis=0)
+        shape_list = np.expand_dims(shape_list, axis=0)
+        img = img.copy()
+
+        self.input_tensor.copy_from_cpu(img)
+        self.predictor.run()
+
+        outputs = [out.copy_to_cpu() for out in self.output_tensors]
+        preds = {"maps": outputs[0]}
+        post_result = self.post_operator(preds, shape_list)
+        dt_boxes = post_result[0]["points"]
+
+        if self.det_box_type == "poly":
+            dt_boxes = self.filter_tag_det_res_only_clip(dt_boxes, ori_im.shape)
+        else:
+            dt_boxes = self.filter_tag_det_res(dt_boxes, ori_im.shape)
+
+        return dt_boxes

+ 450 - 0
hmOCR/parts/operator.py

@@ -0,0 +1,450 @@
+import re
+import cv2
+import pyclipper
+import numpy as np
+from PIL import Image
+from paddle import Tensor
+from shapely.geometry import Polygon
+
+__all__ = [
+    "DetResizeForTest", "NormalizeImage", "ToCHWImage", "KeepKeys",
+    "DBPostProcess", "ClsPostProcess", "CTCLabelDecode"
+]
+
+
+class DetResizeForTest:
+    def __init__(self, **kwargs):
+        if "limit_side_len" in kwargs:
+            self.limit_side_len = kwargs["limit_side_len"]
+            self.limit_type = kwargs.get("limit_type", "min")
+        else:
+            self.limit_side_len = 736
+            self.limit_type = "min"
+
+    def __call__(self, data):
+        img = data["image"]
+        src_h, src_w, _ = img.shape
+        if sum([src_h, src_w]) < 64:
+            img = self.image_padding(img)
+
+        img, [ratio_h, ratio_w] = self.resize_image_type0(img)
+        data["image"] = img
+        data["shape"] = np.array([src_h, src_w, ratio_h, ratio_w])
+        return data
+
+    @staticmethod
+    def image_padding(im, value=0):
+        h, w, c = im.shape
+        im_pad = np.zeros((max(32, h), max(32, w), c), np.uint8) + value
+        im_pad[:h, :w, :] = im
+        return im_pad
+
+    def resize_image_type0(self, img):
+        """
+        resize image to a size multiple of 32 which is required by the network
+        args:
+            img(array): array with shape [h, w, c]
+        return(tuple):
+            img, (ratio_h, ratio_w)
+        """
+        limit_side_len = self.limit_side_len
+        h, w, c = img.shape
+
+        # limit the max side
+        if self.limit_type == "max":
+            if max(h, w) > limit_side_len:
+                if h > w:
+                    ratio = float(limit_side_len) / h
+                else:
+                    ratio = float(limit_side_len) / w
+            else:
+                ratio = 1.
+        elif self.limit_type == "min":
+            if min(h, w) < limit_side_len:
+                if h < w:
+                    ratio = float(limit_side_len) / h
+                else:
+                    ratio = float(limit_side_len) / w
+            else:
+                ratio = 1.
+        elif self.limit_type == "resize_long":
+            ratio = float(limit_side_len) / max(h, w)
+        else:
+            raise Exception("not support limit type, image ")
+        resize_h = int(h * ratio)
+        resize_w = int(w * ratio)
+
+        resize_h = max(int(round(resize_h / 32) * 32), 32)
+        resize_w = max(int(round(resize_w / 32) * 32), 32)
+
+        try:
+            if int(resize_w) <= 0 or int(resize_h) <= 0:
+                return None, (None, None)
+            img = cv2.resize(img, (int(resize_w), int(resize_h)))  # noqa
+        except Exception as e:
+            print(img.shape, resize_w, resize_h, e)
+            exit(1)
+        ratio_h = resize_h / float(h)
+        ratio_w = resize_w / float(w)
+        return img, [ratio_h, ratio_w]
+
+
+class NormalizeImage:
+    def __init__(self, scale, mean, std, order="chw"):
+        self.scale = np.float32(scale)
+        shape = (3, 1, 1) if order == "chw" else (1, 1, 3)
+        self.mean = np.array(mean).reshape(shape).astype("float32")
+        self.std = np.array(std).reshape(shape).astype("float32")
+
+    def __call__(self, data):
+        img = data["image"]
+        if isinstance(img, Image.Image):
+            img = np.array(img)  # noqa
+        assert isinstance(img, np.ndarray), "invalid input img in NormalizeImage"
+        data["image"] = (img.astype("float32") * self.scale - self.mean) / self.std
+        return data
+
+
+class ToCHWImage:
+    def __call__(self, data):
+        img = data["image"]
+        if isinstance(img, Image.Image):
+            img = np.array(img)  # noqa
+        data["image"] = img.transpose((2, 0, 1))
+        return data
+
+
+class KeepKeys:
+    def __init__(self, keep_keys):
+        self.keep_keys = keep_keys
+
+    def __call__(self, data):
+        return [data[key] for key in self.keep_keys]
+
+
+class DBPostProcess:
+    def __init__(
+            self, thresh=0.3, box_thresh=0.7, max_candidates=1000, unclip_ratio=2.0,
+            use_dilation=False, score_mode="fast", box_type="quad"
+    ):
+        self.thresh = thresh
+        self.box_thresh = box_thresh
+        self.max_candidates = max_candidates
+        self.unclip_ratio = unclip_ratio
+        self.min_size = 3
+        self.score_mode = score_mode
+        self.box_type = box_type
+        assert score_mode in [
+            "slow", "fast"
+        ], f"Score mode must be in [slow, fast] but got: {score_mode}"
+
+        self.dilation_kernel = None if not use_dilation else np.array(
+            [[1, 1], [1, 1]])
+
+    def polygons_from_bitmap(self, pred, _bitmap, dest_width, dest_height):
+        """
+        _bitmap: single map with shape (1, H, W), whose values are binarized as {0, 1}
+        """
+
+        bitmap = _bitmap
+        height, width = bitmap.shape
+        boxes, scores = [], []
+
+        contours, _ = cv2.findContours((bitmap * 255).astype(np.uint8), cv2.RETR_LIST, cv2.CHAIN_APPROX_SIMPLE)  # noqa
+
+        for contour in contours[:self.max_candidates]:
+            epsilon = 0.002 * cv2.arcLength(contour, True)  # noqa
+            approx = cv2.approxPolyDP(contour, epsilon, True)  # noqa
+            points = approx.reshape((-1, 2))
+            if points.shape[0] < 4:
+                continue
+
+            score = self.box_score_fast(pred, points.reshape(-1, 2))
+            if self.box_thresh > score:
+                continue
+
+            if points.shape[0] > 2:
+                box = self.unclip(points, self.unclip_ratio)
+                if len(box) > 1:
+                    continue
+            else:
+                continue
+            box = box.reshape(-1, 2)
+
+            _, s_side = self.get_mini_boxes(box.reshape((-1, 1, 2)))
+            if s_side < self.min_size + 2:
+                continue
+
+            box = np.array(box)
+            box[:, 0] = np.clip(
+                np.round(box[:, 0] / width * dest_width), 0, dest_width)
+            box[:, 1] = np.clip(
+                np.round(box[:, 1] / height * dest_height), 0, dest_height)
+            boxes.append(box.tolist())
+            scores.append(score)
+        return boxes, scores
+
+    def boxes_from_bitmap(self, pred, _bitmap, dest_width, dest_height):
+        """
+        _bitmap: single map with shape (1, H, W), whose values are binarized as {0, 1}
+        """
+
+        bitmap, contours = _bitmap, None
+        height, width = bitmap.shape
+
+        outs = cv2.findContours((bitmap * 255).astype(np.uint8), cv2.RETR_LIST, cv2.CHAIN_APPROX_SIMPLE)  # noqa
+        if len(outs) == 3:
+            img, contours, _ = outs[0], outs[1], outs[2]
+        elif len(outs) == 2:
+            contours, _ = outs[0], outs[1]
+
+        num_contours = min(len(contours), self.max_candidates)
+
+        boxes = []
+        scores = []
+        for index in range(num_contours):
+            contour = contours[index]
+            points, s_side = self.get_mini_boxes(contour)
+            if s_side < self.min_size:
+                continue
+            points = np.array(points)
+            if self.score_mode == "fast":
+                score = self.box_score_fast(pred, points.reshape(-1, 2))
+            else:
+                score = self.box_score_slow(pred, contour)
+            if self.box_thresh > score:
+                continue
+
+            box = self.unclip(points, self.unclip_ratio).reshape(-1, 1, 2)  # noqa
+            box, s_side = self.get_mini_boxes(box)
+            if s_side < self.min_size + 2:
+                continue
+            box = np.array(box)
+
+            box[:, 0] = np.clip(
+                np.round(box[:, 0] / width * dest_width), 0, dest_width)
+            box[:, 1] = np.clip(
+                np.round(box[:, 1] / height * dest_height), 0, dest_height)
+            boxes.append(box.astype("int32"))
+            scores.append(score)
+        return np.array(boxes, dtype="int32"), scores
+
+    @staticmethod
+    def unclip(box, unclip_ratio):
+        poly = Polygon(box)
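+        # DB box expansion: offset distance = area * unclip_ratio / perimeter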
+        distance = poly.area * unclip_ratio / poly.length
+        offset = pyclipper.PyclipperOffset()
+        offset.AddPath(box, pyclipper.JT_ROUND, pyclipper.ET_CLOSEDPOLYGON)
+        expanded = np.array(offset.Execute(distance))
+        return expanded
+
+    @staticmethod
+    def get_mini_boxes(contour):
+        bounding_box = cv2.minAreaRect(contour)  # noqa
+        points = sorted(list(cv2.boxPoints(bounding_box)), key=lambda x: x[0])  # noqa
+
+        if points[1][1] > points[0][1]:
+            index_1 = 0
+            index_4 = 1
+        else:
+            index_1 = 1
+            index_4 = 0
+        if points[3][1] > points[2][1]:
+            index_2 = 2
+            index_3 = 3
+        else:
+            index_2 = 3
+            index_3 = 2
+
+        box = [points[index_1], points[index_2], points[index_3], points[index_4]]
+        return box, min(bounding_box[1])
+
+    @staticmethod
+    def box_score_fast(bitmap, _box):
+        """
+        box_score_fast: use the bbox mean score as the box score
+        """
+        h, w = bitmap.shape[:2]
+        box = _box.copy()
+        x_min = np.clip(np.floor(box[:, 0].min()).astype("int32"), 0, w - 1)
+        x_max = np.clip(np.ceil(box[:, 0].max()).astype("int32"), 0, w - 1)
+        y_min = np.clip(np.floor(box[:, 1].min()).astype("int32"), 0, h - 1)
+        y_max = np.clip(np.ceil(box[:, 1].max()).astype("int32"), 0, h - 1)
+
+        mask = np.zeros((y_max - y_min + 1, x_max - x_min + 1), dtype=np.uint8)
+        box[:, 0] = box[:, 0] - x_min
+        box[:, 1] = box[:, 1] - y_min
+        cv2.fillPoly(mask, box.reshape(1, -1, 2).astype("int32"), 1)  # noqa
+        return cv2.mean(bitmap[y_min:y_max + 1, x_min:x_max + 1], mask)[0]  # noqa
+
+    @staticmethod
+    def box_score_slow(bitmap, contour):
+        """
+        box_score_slow: use the polygon mean score as the box score
+        """
+        h, w = bitmap.shape[:2]
+        contour = contour.copy()
+        contour = np.reshape(contour, (-1, 2))
+
+        x_min = np.clip(np.min(contour[:, 0]), 0, w - 1)
+        x_max = np.clip(np.max(contour[:, 0]), 0, w - 1)
+        y_min = np.clip(np.min(contour[:, 1]), 0, h - 1)
+        y_max = np.clip(np.max(contour[:, 1]), 0, h - 1)
+
+        mask = np.zeros((y_max - y_min + 1, x_max - x_min + 1), dtype=np.uint8)
+
+        contour[:, 0] = contour[:, 0] - x_min
+        contour[:, 1] = contour[:, 1] - y_min
+
+        cv2.fillPoly(mask, contour.reshape(1, -1, 2).astype("int32"), 1)  # noqa
+        return cv2.mean(bitmap[y_min:y_max + 1, x_min:x_max + 1], mask)[0]  # noqa
+
+    def __call__(self, outs_dict, shape_list):
+        pred = outs_dict["maps"]
+        if isinstance(pred, Tensor):
+            pred = pred.numpy()
+        pred = pred[:, 0, :, :]
+        segmentation = pred > self.thresh
+
+        boxes_batch = []
+        for batch_index in range(pred.shape[0]):
+            src_h, src_w, ratio_h, ratio_w = shape_list[batch_index]
+            if self.dilation_kernel is not None:
+                mask = cv2.dilate(np.array(segmentation[batch_index]).astype(np.uint8), self.dilation_kernel)  # noqa
+            else:
+                mask = segmentation[batch_index]
+            if self.box_type == "poly":
+                boxes, scores = self.polygons_from_bitmap(pred[batch_index],
+                                                          mask, src_w, src_h)
+            elif self.box_type == "quad":
+                boxes, scores = self.boxes_from_bitmap(pred[batch_index], mask,
+                                                       src_w, src_h)
+            else:
+                raise ValueError("box_type can only be one of ['quad', 'poly']")
+
+            boxes_batch.append({"points": boxes})
+        return boxes_batch
+
+
+class ClsPostProcess:
+    """ Convert between text-label and text-index """
+
+    def __init__(self, label_list=None):
+        self.label_list = label_list
+
+    def __call__(self, preds, label=None, *args, **kwargs):
+        label_list = self.label_list
+        if label_list is None:
+            label_list = {idx: idx for idx in range(preds.shape[-1])}
+
+        if isinstance(preds, Tensor):
+            preds = preds.numpy()
+
+        pred_ids = preds.argmax(axis=1)
+        decode_out = [(label_list[idx], preds[i, idx]) for i, idx in enumerate(pred_ids)]
+        if label is None:
+            return decode_out
+        label = [(label_list[idx], 1.0) for idx in label]
+        return decode_out, label
+
+
+class __BaseRecDecoder:
+    """ Convert between text-label and text-index """
+
+    def __init__(self, character_dict_path=None):
+        self.beg_str = "sos"
+        self.end_str = "eos"
+        self.reverse = False
+        self.character_str = []
+
+        if character_dict_path is None:
+            self.character_str = "0123456789abcdefghijklmnopqrstuvwxyz "
+            dict_character = list(self.character_str)
+        else:
+            with open(character_dict_path, "rb") as fin:
+                lines = fin.readlines()
+                for line in lines:
+                    line = line.decode("utf-8").strip("\n").strip("\r\n")
+                    self.character_str.append(line)
+            self.character_str.append(" ")
+            dict_character = list(self.character_str)
+
+        dict_character = self.add_special_char(dict_character)
+        self.max_index = len(dict_character) - 1
+        self.dict = {}
+        for i, char in enumerate(dict_character):
+            self.dict[char] = i
+        self.character = dict_character
+
+    @staticmethod
+    def pred_reverse(pred):
+        pred_re = []
+        c_current = ""
+        for c in pred:
+            if not bool(re.search("[a-zA-Z0-9 :*./%+-]", c)):
+                if c_current != "":
+                    pred_re.append(c_current)
+                pred_re.append(c)
+                c_current = ""
+            else:
+                c_current += c
+        if c_current != "":
+            pred_re.append(c_current)
+
+        return "".join(pred_re[::-1])
+
+    def add_special_char(self, dict_character):
+        return dict_character
+
+    def decode(self, text_index, text_prob=None, is_remove_duplicate=False, use_space=False):
+        """ convert text-index into text-label. """
+        result_list = []
+        ignored_tokens = self.get_ignored_tokens()
+        batch_size = len(text_index)
+        for batch_idx in range(batch_size):
+            selection = np.ones(len(text_index[batch_idx]), dtype=bool)
+            if is_remove_duplicate:
+                selection[1:] = text_index[batch_idx][1:] != text_index[batch_idx][:-1]
+            for ignored_token in ignored_tokens:
+                selection &= text_index[batch_idx] != ignored_token
+
+            char_list = []
+            for index in text_index[batch_idx][selection]:
+                if index == self.max_index and not use_space:
+                    continue
+                char_list.append(self.character[index])
+            if text_prob is not None:
+                conf_list = text_prob[batch_idx][selection]
+            else:
+                conf_list = [1] * len(selection)
+            if len(conf_list) == 0:
+                conf_list = [0]
+
+            text = "".join(char_list)
+
+            result_list.append((text, np.mean(conf_list).tolist()))
+        return result_list
+
+    @staticmethod
+    def get_ignored_tokens():
+        return [0]  # for ctc blank
+
+
+class CTCLabelDecode(__BaseRecDecoder):
+    """ Convert between text-label and text-index """
+
+    def __init__(self, character_dict_path=None):
+        super(CTCLabelDecode, self).__init__(character_dict_path)
+
+    def __call__(self, preds, use_space=False, *args, **kwargs):
+        if isinstance(preds, tuple) or isinstance(preds, list):
+            preds = preds[-1]
+        if isinstance(preds, Tensor):
+            preds = preds.numpy()
+        preds_idx = preds.argmax(axis=2)
+        preds_prob = preds.max(axis=2)
+        return self.decode(preds_idx, preds_prob, is_remove_duplicate=True, use_space=use_space)
+
+    def add_special_char(self, dict_character):
+        dict_character = ["blank"] + dict_character
+        return dict_character
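
To make the CTC decoding rule in `decode()` concrete, a small sketch with the default lowercase-alphanumeric charset (`character_dict_path=None`); index 0 is the CTC blank:

```python
import numpy as np
from hmOCR.parts.operator import CTCLabelDecode

dec = CTCLabelDecode()  # default charset: "0123456789a-z" plus space
# a plausible CTC emission for "hello": repeats and blanks (0) interleaved
idx = np.array([[dec.dict["h"], 0, dec.dict["e"], dec.dict["e"],
                 0, dec.dict["l"], dec.dict["l"], 0, dec.dict["l"], dec.dict["o"]]])
# consecutive duplicates collapse first ("ee" -> "e", "ll" -> "l"), then blanks drop;
# the blank between the two l-runs is what preserves the double "l" in "hello"
print(dec.decode(idx, is_remove_duplicate=True))  # [('hello', 1.0)]
```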

+ 81 - 0
hmOCR/parts/recognizer.py

@@ -0,0 +1,81 @@
+import cv2
+import math
+import numpy as np
+from .utils import *
+from hmOCR.argument import Args
+from .operator import CTCLabelDecode
+
+
+class Recognizer:
+    def __init__(self, args: "Args"):
+        self.rec_image_shape = [int(v) for v in args.rec_image_shape.split(",")]
+        self.rec_batch_num = args.rec_batch_num
+        # rec_algorithm: only "SVTR_LCNet" now
+        # self.rec_algorithm = args.rec_algorithm
+
+        self.post_op = CTCLabelDecode(args.rec_char_dict_path)
+        self.predictor, self.input_tensor, self.output_tensors = create_predictor(args, "rec")
+
+    def resize_norm_img(self, img, max_wh_ratio):
+        imgC, imgH, imgW = self.rec_image_shape
+        assert imgC == img.shape[2]
+        imgW = int((imgH * max_wh_ratio))
+
+        h, w = img.shape[:2]
+        ratio = w / float(h)
+        if math.ceil(imgH * ratio) > imgW:
+            resized_w = imgW
+        else:
+            resized_w = int(math.ceil(imgH * ratio))
+
+        resized_image = cv2.resize(img, (resized_w, imgH))  # noqa
+        resized_image = resized_image.astype("float32")
+        resized_image = resized_image.transpose((2, 0, 1)) / 255
+        resized_image -= 0.5
+        resized_image /= 0.5
+        padding_im = np.zeros((imgC, imgH, imgW), dtype=np.float32)
+        padding_im[:, :, 0:resized_w] = resized_image
+        return padding_im
+
+    def __call__(self, img_list, use_space=False):
+        img_num = len(img_list)
+        width_list = []
+        for img in img_list:
+            width_list.append(img.shape[1] / float(img.shape[0]))
+        # Sorting can speed up the recognition process
+        indices = np.argsort(np.array(width_list))
+        rec_res = [["", 0.0]] * img_num
+        batch_num = self.rec_batch_num
+
+        for beg_img_no in range(0, img_num, batch_num):
+            end_img_no = min(img_num, beg_img_no + batch_num)
+            norm_img_batch = []
+
+            imgC, imgH, imgW = self.rec_image_shape[:3]
+            max_wh_ratio = imgW / imgH
+            for ino in range(beg_img_no, end_img_no):
+                h, w = img_list[indices[ino]].shape[0:2]
+                wh_ratio = w * 1.0 / h
+                max_wh_ratio = max(max_wh_ratio, wh_ratio)
+            for ino in range(beg_img_no, end_img_no):
+                norm_img = self.resize_norm_img(img_list[indices[ino]], max_wh_ratio)
+                norm_img = norm_img[np.newaxis, :]
+                norm_img_batch.append(norm_img)
+            norm_img_batch = np.concatenate(norm_img_batch)
+            norm_img_batch = norm_img_batch.copy()
+
+            self.input_tensor.copy_from_cpu(norm_img_batch)
+            self.predictor.run()
+            outputs = []
+            for output_tensor in self.output_tensors:
+                output = output_tensor.copy_to_cpu()
+                outputs.append(output)
+            if len(outputs) != 1:
+                preds = outputs
+            else:
+                preds = outputs[0]
+            rec_result = self.post_op(preds, use_space=use_space)
+            for rno in range(len(rec_result)):
+                rec_res[indices[beg_img_no + rno]] = rec_result[rno]
+
+        return rec_res

+ 160 - 0
hmOCR/parts/utils.py

@@ -0,0 +1,160 @@
+from .operator import *  # noqa
+from copy import deepcopy
+from os import path, popen
+from platform import system
+from paddle import inference, fluid
+
+__all__ = ["create_operators", "build_post_process", "create_predictor", "transform"]
+
+
+def create_operators(op_param_list):
+    ops = []
+    for operator in op_param_list:
+        op_name = list(operator)[0]
+        param = {} if operator[op_name] is None else operator[op_name]
+        op = eval(op_name)(**param)
+        ops.append(op)
+    return ops
+
+
+def transform(data, ops=None):
+    if ops is None:
+        ops = []
+    for op in ops:
+        data = op(data)
+        if data is None:
+            return None
+    return data
+
+
+def build_post_process(config):
+    config = deepcopy(config)
+    module_name = config.pop("name")
+
+    return eval(module_name)(**config)
+
+
+def __get_gpu_id():
+    if system() == "Windows":
+        return 0
+
+    if not fluid.core.is_compiled_with_rocm():
+        cmd = "env | grep CUDA_VISIBLE_DEVICES"
+    else:
+        cmd = "env | grep HIP_VISIBLE_DEVICES"
+    env_cuda = popen(cmd).readlines()
+    if len(env_cuda) == 0:
+        return None  # no visible GPU configured in the environment
+    gpu_id = env_cuda[0].strip().split("=")[1]
+    return int(gpu_id[0])
+
+
+def __get_output_tensors(args, mode, predictor):
+    output_names = predictor.get_output_names()
+    output_tensors = []
+    if mode == "rec" and args.rec_algorithm in ["CRNN", "SVTR_LCNet"]:
+        output_name = "softmax_0.tmp_0"
+        if output_name in output_names:
+            return [predictor.get_output_handle(output_name)]
+        else:
+            for output_name in output_names:
+                output_tensor = predictor.get_output_handle(output_name)
+                output_tensors.append(output_tensor)
+    else:
+        for output_name in output_names:
+            output_tensor = predictor.get_output_handle(output_name)
+            output_tensors.append(output_tensor)
+    return output_tensors
+
+
+def create_predictor(args, mode):
+    if mode == "det":
+        model_dir = args.det_model_dir
+    elif mode == "cls":
+        model_dir = args.cls_model_dir
+    else:  # rec
+        model_dir = args.rec_model_dir
+
+    if model_dir is None:
+        print("no model_dir defined in args")
+        exit(1)
+
+    file_names, model_path, param_path = ["model", "inference"], None, None
+    for file_name in file_names:
+        model_file_path = path.join(model_dir, f"{file_name}.pdmodel")
+        params_file_path = path.join(model_dir, f"{file_name}.pdiparams")
+        if path.exists(model_file_path) and path.exists(params_file_path):
+            model_path, param_path = model_file_path, params_file_path
+            break
+    if model_path is None:
+        raise ValueError(f"could not find model.pdmodel or inference.pdmodel in {model_dir}")
+    if param_path is None:
+        raise ValueError(f"could not find model.pdiparams or inference.pdiparams in {model_dir}")
+
+    config = inference.Config(model_path, param_path)
+
+    precision = inference.PrecisionType.Float32
+    if hasattr(args, "precision"):
+        if args.precision == "fp16" and args.use_tensorrt:
+            precision = inference.PrecisionType.Half
+        elif args.precision == "int8":
+            precision = inference.PrecisionType.Int8
+        else:
+            precision = inference.PrecisionType.Float32
+
+    if args.use_gpu:
+        gpu_id = __get_gpu_id()
+        if gpu_id is None:
+            print(
+                "WARNING:",
+                "no GPU was found on this device by nvidia-smi.",
+                "Please check your device, or ignore this if running on Jetson."
+            )
+        config.enable_use_gpu(args.gpu_mem, 0)
+        if args.use_tensorrt:
+            config.enable_tensorrt_engine(
+                workspace_size=1 << 30,
+                precision_mode=precision,
+                max_batch_size=args.max_batch_size,
+                min_subgraph_size=args.min_subgraph_size,  # skip TensorRT subgraphs smaller than this
+                use_calib_mode=False
+            )
+
+            # collect shape
+            trt_shape_f = path.join(model_dir, f"{mode}_trt_dynamic_shape.txt")
+
+            if not path.exists(trt_shape_f):
+                config.collect_shape_range_info(trt_shape_f)
+                print(f"collect dynamic shape info into : {trt_shape_f}")
+            try:
+                config.enable_tuned_tensorrt_dynamic_shape(trt_shape_f, True)
+            except Exception as E:
+                print(E)
+                print("Please keep your paddlepaddle-gpu >= 2.3.0!")
+    else:
+        config.disable_gpu()
+        if args.enable_mkldnn:
+            config.set_mkldnn_cache_capacity(10)
+            config.enable_mkldnn()
+            if hasattr(args, "cpu_threads"):
+                config.set_cpu_math_library_num_threads(args.cpu_threads)
+            else:
+                config.set_cpu_math_library_num_threads(10)
+
+    config.enable_memory_optim()
+    config.disable_glog_info()
+    config.delete_pass("conv_transpose_eltwiseadd_bn_fuse_pass")
+    config.delete_pass("matmul_transpose_reshape_fuse_pass")
+
+    config.switch_use_feed_fetch_ops(False)
+    config.switch_ir_optim(True)
+
+    predictor = inference.create_predictor(config)
+    input_names = predictor.get_input_names()
+
+    input_tensor = None
+    for name in input_names:
+        input_tensor = predictor.get_input_handle(name)
+    output_tensors = __get_output_tensors(args, mode, predictor)
+    return predictor, input_tensor, output_tensors

BIN
hmOCR/static/cls/inference.pdiparams


BIN
hmOCR/static/cls/inference.pdiparams.info


BIN
hmOCR/static/cls/inference.pdmodel


BIN
hmOCR/static/det/inference.pdiparams


BIN
hmOCR/static/det/inference.pdiparams.info


BIN
hmOCR/static/det/inference.pdmodel


File diff suppressed because it is too large
+ 6623 - 0
hmOCR/static/key-set.txt


BIN
hmOCR/static/rec/inference.pdiparams


BIN
hmOCR/static/rec/inference.pdiparams.info


BIN
hmOCR/static/rec/inference.pdmodel


BIN
hmOCR/static/test_image/01.jpg


BIN
hmOCR/static/test_image/02.jpg


BIN
hmOCR/static/test_image/03.jpg


BIN
hmOCR/static/test_image/04.jpg


+ 109 - 0
hmOCR/utility.py

@@ -0,0 +1,109 @@
+import cv2
+import numpy as np
+from os import path, listdir
+
+__all__ = [
+    "sorted_boxes", "get_rotate_crop_image", "get_min_area_rect_crop",
+    "get_image_file_list", "check_and_read"
+]
+
+
+def sorted_boxes(dt_boxes):
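+    # order boxes top-to-bottom, then swap neighbors left-to-right when their tops are within 10 px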
+    num_boxes = dt_boxes.shape[0]
+    _sorted_boxes = sorted(dt_boxes, key=lambda x: (x[0][1], x[0][0]))
+    _boxes = list(_sorted_boxes)
+
+    for i in range(num_boxes - 1):
+        for j in range(i, -1, -1):
+            if abs(_boxes[j + 1][0][1] - _boxes[j][0][1]) < 10 and (_boxes[j + 1][0][0] < _boxes[j][0][0]):
+                tmp = _boxes[j]
+                _boxes[j] = _boxes[j + 1]  # noqa
+                _boxes[j + 1] = tmp
+            else:
+                break
+    return _boxes
+
+
+def get_rotate_crop_image(img, points):
+    """Perspective-crop the quadrilateral `points` out of `img`;
+    rotate the result 90 degrees when the crop comes out much taller than wide."""
+    assert len(points) == 4, "shape of points must be 4*2"
+    img_crop_width = int(max(np.linalg.norm(points[0] - points[1]), np.linalg.norm(points[2] - points[3])))
+    img_crop_height = int(max(np.linalg.norm(points[0] - points[3]), np.linalg.norm(points[1] - points[2])))
+    pts_std = np.float32([[0, 0], [img_crop_width, 0], [img_crop_width, img_crop_height], [0, img_crop_height]])
+    M = cv2.getPerspectiveTransform(points, pts_std)  # noqa
+    dst_img = cv2.warpPerspective(  # noqa
+        img, M, (img_crop_width, img_crop_height),
+        borderMode=cv2.BORDER_REPLICATE, flags=cv2.INTER_CUBIC  # noqa
+    )
+    dst_img_height, dst_img_width = dst_img.shape[0:2]
+    if dst_img_height * 1.0 / dst_img_width >= 1.5:
+        dst_img = np.rot90(dst_img)
+    return dst_img
+
+
+def get_min_area_rect_crop(img, points):
+    bounding_box = cv2.minAreaRect(np.array(points).astype(np.int32))  # noqa
+    points = sorted(list(cv2.boxPoints(bounding_box)), key=lambda x: x[0])  # noqa
+
+    if points[1][1] > points[0][1]:
+        index_a = 0
+        index_d = 1
+    else:
+        index_a = 1
+        index_d = 0
+    if points[3][1] > points[2][1]:
+        index_b = 2
+        index_c = 3
+    else:
+        index_b = 3
+        index_c = 2
+
+    box = [points[index_a], points[index_b], points[index_c], points[index_d]]
+    crop_img = get_rotate_crop_image(img, np.array(box))
+    return crop_img
+
+
+def _check_image_file(file_path):
+    img_end = ("jpg", "bmp", "png", "jpeg", "rgb", "tif", "tiff", "gif")
+    return any([file_path.lower().endswith(e) for e in img_end])
+
+
+def get_image_file_list(img_file):
+    images = []
+    if img_file is None or not path.exists(img_file):
+        raise Exception(f"not found any img file in {img_file}")
+
+    if path.isfile(img_file) and _check_image_file(img_file):
+        images.append(img_file)
+    elif path.isdir(img_file):
+        for single_file in listdir(img_file):
+            file_path = path.join(img_file, single_file)
+            if path.isfile(file_path) and _check_image_file(file_path):
+                images.append(file_path)
+    if len(images) == 0:
+        raise Exception(f"not found any img file in {img_file}")
+    images = sorted(images)
+    return images
+
+
+def check_and_read(img_path):
+    if path.basename(img_path)[-3:].lower() == "gif":
+        gif = cv2.VideoCapture(img_path)  # noqa
+        ret, frame = gif.read()
+        if not ret:
+            print(f"Cannot read {img_path}. This gif image maybe corrupted.")
+            return None, False
+        if len(frame.shape) == 2 or frame.shape[-1] == 1:
+            frame = cv2.cvtColor(frame, cv2.COLOR_GRAY2RGB)  # noqa
+        img = frame[:, :, ::-1]
+        return img, True
+    return None, False

+ 10 - 0
requires.cpu

@@ -0,0 +1,10 @@
+paddlepaddle==2.4.2
+
+opencv-python==4.6.0.66
+pyclipper==1.3.0.post4
+urllib3==1.26.15
+shapely==2.0.1
+
+flask==2.3.1
+gevent==22.10.2
+gunicorn==20.1.0

File diff suppressed because it is too large
+ 9 - 0
static/html/common.svg


BIN
static/html/favicon.png


+ 11 - 0
static/html/identity.svg

@@ -0,0 +1,11 @@
+<?xml version="1.0" standalone="no"?>
+<svg viewBox="0 0 1024 1024" version="1.1" xmlns="http://www.w3.org/2000/svg" width="128" height="128">
+    <path d="M903.56 847.62H120.44c-30.89 0-55.94-25.04-55.94-55.94V232.31c0-30.89 25.04-55.94 55.94-55.94h783.12c30.89 0 55.94 25.04 55.94 55.94v559.38c0 30.89-25.04 55.93-55.94 55.93z"
+          fill="#8C9EFF"/>
+    <path d="M847.63 421.1H651.84c-11.59 0-20.98-9.39-20.98-20.98s9.39-20.98 20.98-20.98h195.78c11.59 0 20.98 9.39 20.98 20.98s-9.39 20.98-20.97 20.98zM847.63 532.97H651.84c-11.59 0-20.98-9.39-20.98-20.98s9.39-20.98 20.98-20.98h195.78c11.59 0 20.98 9.39 20.98 20.98s-9.39 20.98-20.97 20.98zM763.72 644.85H651.84c-11.59 0-20.98-9.39-20.98-20.98s9.39-20.98 20.98-20.98h111.88c11.59 0 20.98 9.39 20.98 20.98s-9.39 20.98-20.98 20.98z"
+          fill="#E1F5FF"/>
+    <path d="M344.19 410.61m-78.66 0a78.66 78.66 0 1 0 157.32 0 78.66 78.66 0 1 0-157.32 0Z"
+          fill="#FFD600"/>
+    <path d="M487.09 692.05c16.25 0 28.15-12.94 24.12-26.22-21.14-69.7-87.9-120.62-167.02-120.62-79.13 0-145.88 50.92-167.02 120.62-4.03 13.28 7.88 26.22 24.12 26.22h285.8z"
+          fill="#FFD600"/>
+</svg>

File diff suppressed because it is too large
+ 13 - 0
static/html/more.svg


+ 27 - 0
templates/com_index.html

@@ -0,0 +1,27 @@
+<!DOCTYPE html>
+<html lang="zh">
+<head>
+    <meta charset="UTF-8">
+    <title>upload index</title>
+</head>
+<body>
+<h2>原始OCR:</h2>
+<form action="/com/" method="POST" enctype="multipart/form-data">
+    <input type="file" name="picture">
+    <input type="text" name="type" value="raw" hidden>
+    <input type="submit" value="上传并识别">
+</form>
+<h2>过滤结果:</h2>
+<form action="/com/" method="POST" enctype="multipart/form-data">
+    <input type="file" name="picture">
+    <input type="text" name="type" value="filter" hidden>
+    <input type="submit" value="上传并识别">
+</form>
+<h2>在线演示:</h2>
+<form action="/com/" method="POST" enctype="multipart/form-data">
+    <input type="file" name="picture">
+    <input type="text" name="type" value="html" hidden>
+    <input type="submit" value="上传并识别">
+</form>
+</body>
+</html>
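
Each form above posts multipart form data to /com/; a minimal client sketch using the third-party requests library, assuming the service listens on localhost:5050 (the port configured below in utils/conf.py):

    import requests

    with open("hmOCR/static/test_image/01.jpg", "rb") as fp:
        resp = requests.post(
            "http://localhost:5050/com/",
            files={"picture": fp},
            data={"type": "filter"},  # same hidden field the form sends
        )
    print(resp.json())  # {"success": ..., "message": ..., "data": ...}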

+ 88 - 0
templates/com_result.html

@@ -0,0 +1,88 @@
+<!DOCTYPE html>
+<html lang="zh">
+<head>
+    <meta charset="UTF-8">
+    <title>通用OCR结果展示</title>
+    <style>
+        html, body {
+            width: 100%;
+            padding: 0;
+            margin: 0;
+        }
+
+        .img-line {
+            width: 100%;
+            box-sizing: border-box;
+            display: flex;
+            justify-content: center;
+            margin-top: 50px;
+        }
+
+        img {
+            width: 600px;
+            height: auto;
+            box-sizing: border-box;
+            padding: 5px;
+            border: 1px solid #000;
+        }
+
+        .data-table {
+            width: 100%;
+            justify-content: center;
+            box-sizing: border-box;
+            margin: 50px 0;
+            padding: 0 20px;
+        }
+
+        table {
+            width: 100%;
+            border: none;
+            background-color: aqua;
+        }
+
+        .col1 {
+            text-align: center;
+            width: 5%;
+        }
+
+        .col2 {
+            width: 80%;
+        }
+
+        .col3 {
+            width: 15%;
+        }
+
+        td, th {
+            background-color: white;
+        }
+    </style>
+</head>
+<body>
+<div class="img-line">
+    <a target="_blank" href="/{{ raw }}">
+        <img src="/{{ raw }}" alt="raw">
+    </a>
+</div>
+<div class="data-table">
+    <table>
+        <thead>
+        <tr>
+            <th class="col1">序号</th>
+            <th class="col2">内容</th>
+            <th class="col3">概率</th>
+        </tr>
+        </thead>
+        <tbody>
+        {% for item in data %}
+            <tr>
+                <td class="col1">{{ item.index }}</td>
+                <td class="col2">{{ item.word }}</td>
+                <td class="col3">{{ item.rate }}</td>
+            </tr>
+        {% endfor %}
+        </tbody>
+    </table>
+</div>
+</body>
+</html>
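
The template expects a raw image path plus a list of rows with index/word/rate keys; a hedged sketch of the call inside a Flask view (names inferred from the template itself, not from the blues/ code):

    from flask import render_template

    def com_result_page(raw_path, rows):
        # rows: e.g. [{"index": 1, "word": "示例文本", "rate": "0.9876"}]
        # raw_path is rendered as /{{ raw }}, so pass it without a leading slash
        return render_template("com_result.html", raw=raw_path, data=rows)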

+ 33 - 0
templates/idc_index.html

@@ -0,0 +1,33 @@
+<!DOCTYPE html>
+<html lang="zh">
+<head>
+    <meta charset="UTF-8">
+    <title>upload index</title>
+</head>
+<body>
+<h2>API 人像面:</h2>
+<form action="/idc/" method="POST" enctype="multipart/form-data">
+    <input type="file" name="picture">
+    <input type="text" name="which" value="face" hidden>
+    <input type="submit" value="上传并识别">
+</form>
+<h2>API 国徽面:</h2>
+<form action="/idc/" method="POST" enctype="multipart/form-data">
+    <input type="file" name="picture">
+    <input type="text" name="which" value="icon" hidden>
+    <input type="submit" value="上传并识别">
+</form>
+<h2>在线 人像面:</h2>
+<form action="/idc/html/" method="POST" enctype="multipart/form-data">
+    <input type="file" name="picture">
+    <input type="text" name="which" value="face" hidden>
+    <input type="submit" value="上传并识别">
+</form>
+<h2>在线 国徽面:</h2>
+<form action="/idc/html/" method="POST" enctype="multipart/form-data">
+    <input type="file" name="picture">
+    <input type="text" name="which" value="icon" hidden>
+    <input type="submit" value="上传并识别">
+</form>
+</body>
+</html>
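
The /idc/ forms differ from /com/ only in the which field; a corresponding client sketch under the same assumptions (id_face.jpg is a hypothetical sample image):

    import requests

    with open("id_face.jpg", "rb") as fp:
        resp = requests.post(
            "http://localhost:5050/idc/",
            files={"picture": fp},
            data={"which": "face"},  # or "icon" for the national-emblem side
        )
    print(resp.json())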

+ 85 - 0
templates/k-v_result.html

@@ -0,0 +1,85 @@
+<!DOCTYPE html>
+<html lang="zh">
+<head>
+    <meta charset="UTF-8">
+    <title>键值对OCR结果展示</title>
+    <style>
+        html, body {
+            width: 100%;
+            padding: 0;
+            margin: 0;
+        }
+
+        .img-line {
+            width: 100%;
+            box-sizing: border-box;
+            display: flex;
+            justify-content: center;
+            margin-top: 50px;
+        }
+
+        img {
+            width: 600px;
+            height: auto;
+            box-sizing: border-box;
+            padding: 5px;
+            border: 1px solid #000;
+        }
+
+        .data-table {
+            width: 100%;
+            justify-content: center;
+            box-sizing: border-box;
+            margin: 50px 0;
+            padding: 0 20px;
+        }
+
+        table {
+            width: 100%;
+            border: none;
+            background-color: aqua;
+        }
+
+        .col-key {
+            width: 20%;
+        }
+
+        .col-value {
+            width: 80%;
+        }
+
+        td, th {
+            background-color: white;
+        }
+
+        .center {
+            text-align: center;
+        }
+    </style>
+</head>
+<body>
+<div class="img-line">
+    <a target="_blank" href="/{{ raw }}">
+        <img src="/{{ raw }}" alt="raw">
+    </a>
+</div>
+<div class="data-table">
+    <table>
+        <thead>
+        <tr>
+            <th class="col-key">JSON键</th>
+            <th class="col-value">数据值</th>
+        </tr>
+        </thead>
+        <tbody>
+        {% for key, value in data.items() %}
+            <tr>
+                <td class="center">{{ key }}</td>
+                <td>{{ value }}</td>
+            </tr>
+        {% endfor %}
+        </tbody>
+    </table>
+</div>
+</body>
+</html>

+ 77 - 0
templates/navigate.html

@@ -0,0 +1,77 @@
+<!DOCTYPE html>
+<html lang="zh">
+<head>
+    <meta charset="UTF-8">
+    <title>HuiMv OCR Navigator</title>
+    <style>
+        html, body {
+            width: 100%;
+            background-color: #eeeeee;
+            margin: 0;
+            padding: 0;
+        }
+
+        h1 {
+            padding-left: 50px;
+            margin-bottom: 40px;
+        }
+
+        .demos {
+            width: 100%;
+            display: flex;
+            justify-content: space-evenly;
+
+            box-sizing: border-box;
+            padding: 20px 100px;
+        }
+
+        .demo {
+            width: 220px;
+            height: 260px;
+            border: 1px solid #000000;
+            background-color: white;
+            border-radius: 4px;
+            cursor: pointer;
+            display: flex;
+            flex-direction: column;
+            align-items: center;
+            box-sizing: border-box;
+            padding: 4px;
+        }
+
+        .demo > img {
+            width: 220px;
+            height: 150px;
+            margin-bottom: 10px;
+            border-bottom: 1px solid gray;
+            box-sizing: border-box;
+            padding: 20px;
+        }
+
+
+    </style>
+</head>
+<body>
+<h1>HuiMv OCR Navigator</h1>
+<div class="demos">
+    <div rel="/com" class="demo link">
+        <img src="/static/html/common.svg" alt="common">
+        <span>通用内容识别模型,可识别任意图片中的所有文字内容,对图片要求不高。</span>
+    </div>
+    <div rel="/idc" class="demo link">
+        <img src="/static/html/identity.svg" alt="identity">
+        <span>中国大陆身份证内容识别,主要识别:姓名、性别、民族、身份证号、地址、有效日期。</span>
+    </div>
+    <div class="demo">
+        <img src="/static/html/more.svg" alt="more">
+        <span>更多内容,有待开发...<br>更多内容,有待开发...<br>更多内容,有待开发...</span>
+    </div>
+</div>
+<script>
+    let $links = document.getElementsByClassName("link");
+    for (let $link of $links) $link.onclick = function () {
+        window.location.href = this.getAttribute("rel");
+    }
+</script>
+</body>
+</html>

+ 1 - 0
utils/__init__.py

@@ -0,0 +1 @@
+from .util import *

+ 7 - 0
utils/conf.py

@@ -0,0 +1,7 @@
+MAX_CONTENT_LENGTH = 5 * 1024 * 1024  # 5 MB image upload limit
+DEBUG = False
+JSON_AS_ASCII = False
+TEMPLATES_AUTO_RELOAD = True
+
+SERVER_HOST = "0.0.0.0"
+SERVER_PORT = 5050
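
These upper-case names follow Flask's config convention; a sketch of how they would typically be loaded (whether app.py wires it exactly this way is an assumption):

    from flask import Flask
    from utils import conf

    app = Flask(__name__)
    app.config.from_object(conf)  # picks up upper-case attributes only
    app.run(host=conf.SERVER_HOST, port=conf.SERVER_PORT)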

+ 80 - 0
utils/util.py

@@ -0,0 +1,80 @@
+import cv2
+import numpy as np
+from typing import Union
+from flask import jsonify
+from random import randint
+from hmOCR import HuiMvOcr, Args
+from time import localtime, strftime
+
+__all__ = [
+    "Response", "rand_str", "current_time", "get_ext_name", "is_image_ext",
+    "json_all", "str_include", "read_img", "rot_img", "save_img", "Engine"
+]
+
+__StrBase = "qwertyuioplkjhgfdsazxcvbnm1234567890ZXCVBNMLKJHGFDSAQWERTYUIOP"
+__StrBaseLen = len(__StrBase) - 1
+__AcceptExtNames = ["jpg", "jpeg", "bmp", "png", "rgb", "tif", "tiff", "gif", "pdf"]
+Engine = HuiMvOcr(Args())
+
+
+def Response(message: "Union[str, None]" = None, data=None):
+    # a None message means success; any message is treated as an error description
+    if message is None:
+        return jsonify(success=True, message="操作成功", data=data)
+    return jsonify(success=False, message=message, data=data)
+
+
+def rand_str(size: "int" = 8) -> "str":
+    return "".join([__StrBase[randint(0, __StrBaseLen)] for _ in range(size)])
+
+
+def current_time() -> "str":
+    return strftime("%Y-%m-%d_%H-%M-%S", localtime())
+
+
+def get_ext_name(name: "str") -> "str":
+    return name.split(".")[-1].lower()
+
+
+def is_image_ext(ext: "str") -> "bool":
+    return ext in __AcceptExtNames
+
+
+def json_all(data: "Union[list, dict]") -> "bool":
+    # recursively verify that no string field inside the nested structure is empty
+    if isinstance(data, list):
+        for item in data:
+            if isinstance(item, str) and not item:
+                return False
+            elif isinstance(item, (list, dict)) and not json_all(item):
+                return False
+        return True
+    elif isinstance(data, dict):
+        for value in data.values():
+            if isinstance(value, str) and not value:
+                return False
+            elif isinstance(value, (list, dict)) and not json_all(value):
+                return False
+        return True
+    raise TypeError(f"expected node types are [list, dict], but got {type(data)} instead.")
+
+
+def str_include(str_long: "str", str_short: "str") -> "bool":
+    # True when every character of str_short occurs somewhere in str_long
+    for it in str_short:
+        if it not in str_long:
+            return False
+    return True
+
+
+def read_img(content: "bytes") -> "np.ndarray":
+    # np.frombuffer replaces the deprecated np.fromstring; decode as a color image
+    return cv2.imdecode(np.frombuffer(content, np.uint8), cv2.IMREAD_COLOR)  # noqa
+
+
+def rot_img(img: "np.ndarray") -> "list[np.ndarray]":
+    return [img, np.rot90(img), np.rot90(img, 2), np.rot90(img, 3)]
+
+
+def save_img(filename: "str", content: "Union[bytes, np.ndarray]"):
+    if isinstance(content, np.ndarray):
+        return cv2.imwrite(filename, content)  # noqa
+    with open(filename, "wb") as fp:
+        fp.write(content)  # the with-block closes the file; no explicit close needed
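
A small usage sketch for these helpers (Response is omitted because jsonify needs an active Flask application context):

    from utils import json_all, rand_str, current_time

    idc = {"name": "张三", "nation": "汉", "id": "11010519491231002X"}
    assert json_all(idc)  # no empty string anywhere in the structure

    # a unique save path for an uploaded picture
    save_name = f"static/images/{current_time()}_{rand_str()}.jpg"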