ocr_yolo triton-inference-server

乔峰昇
Showing 11 changed files with 308 additions and 0 deletions
.gitignore
OCR_Engine
README.md
bank_ocr_inference.py
triton_pipeline.py
yolov5_onnx_demo/api/yolov5_onnx_server.py
yolov5_onnx_demo/api_test.py
yolov5_onnx_demo/model/__init__.py
yolov5_onnx_demo/model/__pycache__/__init__.cpython-36.pyc
yolov5_onnx_demo/model/__pycache__/yolov5_infer.cpython-36.pyc
yolov5_onnx_demo/model/yolov5_infer.py
--- a/.gitignore 0 → 100644
View file @d479b4e
+++ b/.gitignore 0 → 100644
View file @d479b4e
+model_repository/
+.idea/
--- a/OCR_Engine @ 3dddc11a
+++ b/OCR_Engine @ 3dddc11a
+Subproject commit 3dddc11a8a1d369ca4fbd0b69e4e21e6af81cc4c
--- a/README.md 0 → 100644
View file @d479b4e
+++ b/README.md 0 → 100644
View file @d479b4e
+## OCR+yolov5  triton-inference-server服务
+
+1.使用docker启动triton服务
+
+    sudo docker run --gpus="device=0" --rm -p 8000:8000 -p 8001:8001 -p 8002:8002 -v /home/situ/qfs/triton_inference_server/demo/model_repository:/models nvcr.io/nvidia/tritonserver:21.10-py3 tritonserver --model-repository=/models
+    
+2.分别启动OCR和yolov5的web服务
+
+    cd OCR_Engine/api
+    python ocr_engine_server.py
+
+    cd yolov5_onnx_demo/api
+    python yolov5_onnx_server.py
+
+3.pipeline测试
+
+    python triton_pipeline.py
+
--- a/bank_ocr_inference.py 0 → 100644
View file @d479b4e
+++ b/bank_ocr_inference.py 0 → 100644
View file @d479b4e
--- a/triton_pipeline.py 0 → 100644
View file @d479b4e
+++ b/triton_pipeline.py 0 → 100644
View file @d479b4e
+import base64
+import json
+from bank_ocr_inference import *
+
+
+def enlarge_position(box):
+    x1, y1, x2, y2 = box
+    w, h = abs(x2 - x1), abs(y2 - y1)
+    y1, y2 = max(y1 - h // 3, 0), y2 + h // 3
+    x1, x2 = max(x1 - w // 8, 0), x2 + w // 8
+    return [x1, y1, x2, y2]
+
+
+def path_base64(file_path):
+    f = open(file_path, 'rb')
+    file64 = base64.b64encode(f.read())  # image 64 bytes 类型
+    file64 = file64.decode('utf-8')
+    return file64
+
+
+def bgr_base64(image):
+    _, img64 = cv2.imencode('.jpg', image)
+    img64 = base64.b64encode(img64)
+    return img64.decode('utf-8')
+
+
+def base64_bgr(img64):
+    str_img64 = base64.b64decode(img64)
+    image = np.frombuffer(str_img64, np.uint8)
+    image = cv2.imdecode(image, cv2.IMREAD_COLOR)
+    return image
+
+
+def tamper_detect_(image):
+    img64 = bgr_base64(image)
+    resp = requests.post(url=r'http://192.168.10.11:8009/tamper_det', data=json.dumps({'img': img64}))
+    results = resp.json()
+    return results
+
+
+if __name__ == '__main__':
+    image = cv2.imread(
+        '/data/situ_invoice_bill_data/银行流水样本/普通打印-部分格线-竖版-农业银行-8列/_1594626974.367834page_20_img_0.jpg')
+    st = time.time()
+    ocr_results = bill_ocr(image)
+    et1 = time.time()
+    info_results = extract_bank_info(ocr_results)
+    et2 = time.time()
+    tamper_results = []
+    if len(info_results) != 0:
+        for info_result in info_results:
+            box = [info_result[1][0], info_result[1][1], info_result[1][4], info_result[1][5]]
+            x1, y1, x2, y2 = enlarge_position(box)
+            # x1, y1, x2, y2 = box
+            info_image = image[y1:y2, x1:x2, :]
+            results = tamper_detect_(info_image)
+            print(results)
+            if len(results['results']) != 0:
+                for res in results['results']:
+                    cx = int(res[0])
+                    cy = int(res[1])
+                    width = int(res[2])
+                    height = int(res[3])
+                    left = cx - width // 2
+                    top = cy - height // 2
+                    absolute_position = [x1 + left, y1 + top, x1 + left + width, y1 + top + height]
+                    # absolute_position = [x1+left, y1+top, x2, y2]
+                    tamper_results.append(absolute_position)
+    et3 = time.time()
+    print(tamper_results)
+
+    print(f'all time:{et3 - st}  ocr time:{et1 - st}  extract info time:{et2 - et1}  yolo time:{et3 - et2}')
+    for i in tamper_results:
+        cv2.rectangle(image, tuple(i[:2]), tuple(i[2:]), (0, 0, 255), 2)
+    cv2.imshow('info', image)
+    cv2.waitKey(0)
--- a/yolov5_onnx_demo/api/yolov5_onnx_server.py 0 → 100644
View file @d479b4e
+++ b/yolov5_onnx_demo/api/yolov5_onnx_server.py 0 → 100644
View file @d479b4e
+import base64
+
+import cv2
+import numpy as np
+from sanic import Sanic
+from sanic.response import json
+from yolov5_onnx_demo.model.yolov5_infer import *
+
+
+def base64_to_bgr(bs64):
+    img_data = base64.b64decode(bs64)
+    img_arr = np.fromstring(img_data, np.uint8)
+    img_np = cv2.imdecode(img_arr, cv2.IMREAD_COLOR)
+    return img_np
+
+
+# Sanic application object; the /tamper_det route below is registered on it.
+app = Sanic('tamper_det')
+
+
+@app.post('/tamper_det')
+def hello(request):
+    d = request.json
+    print(d['img'])
+    img = base64_to_bgr(d['img'])
+    result = grpc_detect(img)
+
+    return json({'results': result})
+
+
+if __name__ == '__main__':
+    app.run(host='192.168.10.11', port=8009,workers=10)
--- a/yolov5_onnx_demo/api_test.py 0 → 100644
View file @d479b4e
+++ b/yolov5_onnx_demo/api_test.py 0 → 100644
View file @d479b4e
+import base64
+
+import requests
+import json
+from yolov5_onnx_demo.model.yolov5_infer import *
+
+def path_base64(file_path):
+    f = open(file_path, 'rb')
+    file64 = base64.b64encode(f.read())  # image 64 bytes 类型
+    file64 = file64.decode('utf-8')
+    return file64
+
+
+res = requests.post('http://192.168.10.11:8009/tamper_det', data=json.dumps(
+    {'img': path_base64('/data/situ_invoice_bill_data/qfs_train_val_data/train_data/machine/minsheng/images/train/_1597386625.07514page_20_img_0_machine_name_full_splicing.jpg')}))
+results = res.json()
+img = cv2.imread(
+        '/data/situ_invoice_bill_data/qfs_train_val_data/train_data/machine/minsheng/images/train/_1597386625.07514page_20_img_0_machine_name_full_splicing.jpg')
+print(res)
+plot_label(img,results['keys'])
--- a/yolov5_onnx_demo/model/__init__.py 0 → 100644
View file @d479b4e
+++ b/yolov5_onnx_demo/model/__init__.py 0 → 100644
View file @d479b4e
--- a/yolov5_onnx_demo/model/__pycache__/__init__.cpython-36.pyc 0 → 100644
View file @d479b4e
+++ b/yolov5_onnx_demo/model/__pycache__/__init__.cpython-36.pyc 0 → 100644
View file @d479b4e
--- a/yolov5_onnx_demo/model/__pycache__/yolov5_infer.cpython-36.pyc 0 → 100644
View file @d479b4e
+++ b/yolov5_onnx_demo/model/__pycache__/yolov5_infer.cpython-36.pyc 0 → 100644
View file @d479b4e
--- a/yolov5_onnx_demo/model/yolov5_infer.py 0 → 100644
View file @d479b4e
+++ b/yolov5_onnx_demo/model/yolov5_infer.py 0 → 100644
View file @d479b4e
+import cv2
+import numpy as np
+import tritonclient.grpc as grpcclient
+
+
+def keep_resize_padding(image):
+    '''
+    注意由于输入需要固定640*640的大小，而官方的推理为了加速采用了最小缩放比的方式进行
+    导致输入的尺寸不固定，重写resize方法，添加padding到640*640
+    '''
+    h, w, c = image.shape
+    if h >= w:
+        pad1 = (h - w) // 2
+        pad2 = h - w - pad1
+        p1 = np.ones((h, pad1, 3)) * 114.0
+        p2 = np.ones((h, pad2, 3)) * 114.0
+        p1, p2 = p1.astype(np.uint8), p2.astype(np.uint8)
+        new_image = np.hstack((p1, image, p2))
+        padding_info = [pad1, pad2, 0]
+    else:
+        pad1 = (w - h) // 2
+        pad2 = w - h - pad1
+        p1 = np.ones((pad1, w, 3)) * 114.0
+        p2 = np.ones((pad2, w, 3)) * 114.0
+        p1, p2 = p1.astype(np.uint8), p2.astype(np.uint8)
+        new_image = np.vstack((p1, image, p2))
+        padding_info = [pad1, pad2, 1]
+    new_image = cv2.resize(new_image, (640, 640))
+    return new_image, padding_info
+
+
+# remove padding
+def extract_authentic_bboxes(image, padding_info, bboxes):
+    '''
+    反算坐标信息
+    '''
+    pad1, pad2, pad_type = padding_info
+    h, w, c = image.shape
+    bboxes = np.array(bboxes)
+    max_slide = max(h, w)
+    scale = max_slide / 640
+    bboxes[:, :4] = bboxes[:, :4] * scale
+    if pad_type == 0:
+        bboxes[:, 0] = bboxes[:, 0] - pad1
+    else:
+        bboxes[:, 1] = bboxes[:, 1] - pad1
+    return bboxes.tolist()
+
+
+# NMS
+def py_nms_cpu(
+        prediction,
+        conf_thres=0.25,
+        iou_thres=0.45,
+):
+    """Non-Maximum Suppression (NMS) on inference results to reject overlapping detections
+
+    Returns:
+         list of detections, on (n,6) tensor per image [xyxy, conf, cls]
+    """
+    xc = prediction[..., 4] > conf_thres  # candidates
+    prediction = prediction[xc]
+
+    # MNS
+    x1 = prediction[..., 0] - prediction[..., 2] / 2
+    y1 = prediction[..., 1] - prediction[..., 3] / 2
+    x2 = prediction[..., 0] + prediction[..., 2] / 2
+    y2 = prediction[..., 1] + prediction[..., 3] / 2
+
+    areas = (x2 - x1 + 1) * (y2 - y1 + 1)
+    score = prediction[..., 5]
+    order = np.argsort(score)
+    keep = []
+    while order.size > 0:
+        i = order[0]
+        keep.append(i)
+
+        xx1 = np.maximum(x1[i], x1[order[1:]])
+        yy1 = np.maximum(y1[i], y1[order[1:]])
+        xx2 = np.minimum(x2[i], x2[order[1:]])
+        yy2 = np.minimum(y2[i], y2[order[1:]])
+
+        ww, hh = np.maximum(0, xx2 - xx1 + 1), np.maximum(0, yy2 - yy1 + 1)
+        inter = ww * hh
+
+        over = inter / (areas[i] + areas[order[1:]] - inter)
+
+        idx = np.where(over < iou_thres)[0]
+        order = order[idx + 1]
+
+    return prediction[keep]
+
+
+def client_init(url='localhost:8001',
+                ssl=False,
+                private_key=None,
+                root_certificates=None,
+                certificate_chain=None,
+                verbose=False):
+    triton_client = grpcclient.InferenceServerClient(
+        url=url,
+        verbose=verbose,  # 详细输出 默认是False
+        ssl=ssl,
+        root_certificates=root_certificates,
+        private_key=private_key,
+        certificate_chain=certificate_chain,
+    )
+    return triton_client
+
+
+# Module-level Triton gRPC client, created at import time and used by
+# grpc_detect.
+triton_client = client_init('localhost:8001')
+# Passed to triton_client.infer() as its compression_algorithm argument.
+compression_algorithm = None
+# Input tensor, output tensor and model names used when grpc_detect builds
+# the inference request.
+input_name = 'images'
+output_name = 'output0'
+model_name = 'yolov5'
+
+
+def grpc_detect(img):
+    image, padding_info = keep_resize_padding(img)
+    image = image.transpose((2, 0, 1))[::-1]
+    image = image.astype(np.float32)
+    image = image / 255.0
+    if len(image.shape) == 3:
+        image = image[None]
+
+    outputs, inputs = [], []
+
+    # 动态输入
+    input_shape = image.shape
+    inputs.append(grpcclient.InferInput(input_name, input_shape, 'FP32'))
+    outputs.append(grpcclient.InferRequestedOutput(output_name))
+
+    inputs[0].set_data_from_numpy(image.astype(np.float32))
+
+    pred = triton_client.infer(
+        model_name=model_name,
+        inputs=inputs, outputs=outputs,
+        compression_algorithm=compression_algorithm
+    )
+    pred = pred.as_numpy(output_name).copy()
+    result_bboxes = py_nms_cpu(pred)
+    result_bboxes = extract_authentic_bboxes(img, padding_info, result_bboxes)
+    return result_bboxes
+
+
+def plot_label(img, result_bboxes):
+    print(result_bboxes)
+    for bbox in result_bboxes:
+        x, y, w, h, conf, cls = bbox
+        cv2.rectangle(img, (int(x - w // 2), int(y - h // 2)), (int(x + w // 2), int(y + h // 2)), (0, 0, 255), 2)
+    cv2.imshow('im', img)
+    cv2.waitKey(0)
+
+
+if __name__ == '__main__':
+    img = cv2.imread(
+        '/data/situ_invoice_bill_data/qfs_train_val_data/train_data/authentic/gongshang/images/val/_1594890232.0110397page_11_img_0_name_au_gongshang.jpg')
+
+    result_bboxes = grpc_detect(img)
+    plot_label(result_bboxes)