Meituan-Dianping
diff --git a/‎.gitignore‎
Lines changed: 5 additions & 0 deletions b/‎.gitignore‎
Lines changed: 5 additions & 0 deletions
diff --git a/‎Dockerfile‎
Lines changed: 12 additions & 0 deletions b/‎Dockerfile‎
Lines changed: 12 additions & 0 deletions
diff --git a/‎LICENSE‎
Lines changed: 21 additions & 0 deletions b/‎LICENSE‎
Lines changed: 21 additions & 0 deletions
diff --git a/‎README.md‎
Lines changed: 41 additions & 0 deletions b/‎README.md‎
Lines changed: 41 additions & 0 deletions
diff --git a/‎api/vision_api.py‎
Lines changed: 62 additions & 0 deletions b/‎api/vision_api.py‎
Lines changed: 62 additions & 0 deletions
diff --git a/‎capture/image_1.png‎
243 KB b/‎capture/image_1.png‎
243 KB
diff --git a/‎dbnet_crnn/image_text.py‎
Lines changed: 95 additions & 0 deletions b/‎dbnet_crnn/image_text.py‎
Lines changed: 95 additions & 0 deletions
diff --git a/‎dbnet_crnn/modelv1.1/det/model‎
337 KB b/‎dbnet_crnn/modelv1.1/det/model‎
337 KB
diff --git a/‎dbnet_crnn/modelv1.1/det/params‎
2.19 MB b/‎dbnet_crnn/modelv1.1/det/params‎
2.19 MB
diff --git a/‎dbnet_crnn/modelv1.1/rec/model‎
440 KB b/‎dbnet_crnn/modelv1.1/rec/model‎
440 KB
@@ -0,0 +1,5 @@
+*.pyc
+.DS_Store
+.idea/
+capture/local_*/
+*.so
@@ -0,0 +1,12 @@
+# Base image: CPython 3.6.5.
+FROM python:3.6.5
+# Copy only what the server needs. Every destination is an absolute path under
+# /vision so the result does not depend on the working directory at this point.
+COPY ./api /vision/api/
+COPY ./service /vision/service/
+COPY ./dbnet_crnn /vision/dbnet_crnn
+COPY ./requirements.txt /vision/requirements.txt
+COPY ./server.py /vision/server.py
+# Package index used by both pip invocations below; override at build time
+# with --build-arg PIP_MIRROR=<url>.
+ARG PIP_MIRROR=https://mirrors.aliyun.com/pypi/simple/
+WORKDIR /vision
+# Create the capture directory and install dependencies. --no-cache-dir keeps
+# pip's download cache out of the image layer.
+RUN mkdir capture \
+    && pip install --no-cache-dir --upgrade pip -i ${PIP_MIRROR} \
+    && pip install --no-cache-dir -r requirements.txt -i ${PIP_MIRROR}
+CMD ["python3", "server.py"]
@@ -0,0 +1,21 @@
+MIT License
+
+Copyright (c) 2019 美团点评
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
@@ -0,0 +1,41 @@
+# Vision UI
+
+![GitHub](https://img.shields.io/badge/Python-3.6-blue)
+![GitHub](https://img.shields.io/github/license/Meituan-Dianping/vision-diff)
+![GitHub](https://img.shields.io/docker/cloud/build/brighthai/vision-ui)
+
+## 什么是Vision UI
+
+Vision UI是一组图像处理算法，来源于美团视觉测试工具，提供如视觉对比(增量式对比)、图像融合和文本识别。
+
+本项目无需训练模型，基于训练模型的项目在[Vision-ml](https://github.com/Meituan-Dianping/vision)
+
+## 特性
+
+* 超越像素对比-[视觉对比](resources/vision_diff_cn.md)
+
+* 基于模板匹配-[图像融合](resources/vision_merge.md)
+
+* 集成模型-[文本识别](resources/vision_text.md)
+
+
+## 效果展示
+### 图像融合
+| 1.png                           | 2.png                           |  3.png                   | merge                                  |
+| ------------------------------ | -------------------------------- | -------------------------------- | ------------------------------------- |
+| ![](image/1_0.png)          | ![](image/1_1.png)                  | ![](image/1_2.png)        | ![](image/1_merge.png)                 |
+
+### 视觉对比
+
+| base                           | comparison                       | diff                                  |
+| ------------------------------ | -------------------------------- | ------------------------------------- |
+| ![](image/base_1.png)          | ![](image/comp_1.png)            | ![](image/diff_1.png)                 |
+
+
+
+
+## License
+
+This project is licensed under the [MIT License](./LICENSE).
+
+
@@ -0,0 +1,62 @@
+from flask import jsonify
+from flask import request
+from flask import Blueprint
+from flask import make_response
+from service.image_diff import ImageDiff
+from service.image_merge import Stitcher
+from service.image_similar import HashSimilar
+from service.image_text import get_image_text
+from service.image_utils import get_pop_v
+
+# Blueprint that groups every route in this module under the /vision URL prefix.
+vision = Blueprint('vision', __name__, url_prefix='/vision')
+
+
+@vision.route('/diff', methods=["POST"])
+def vision_diff():
+    """Handle POST /vision/diff.
+
+    Reads ``image1``, ``image2`` and ``image_diff_name`` from the JSON request
+    body, hands them to ``ImageDiff().get_image_score`` and wraps whatever it
+    returns as ``{"code": 0, "data": <result>}``.
+    """
+    score_images = ImageDiff().get_image_score
+    payload = request.json
+    result = score_images(payload['image1'], payload['image2'], payload['image_diff_name'])
+    return jsonify({"code": 0, "data": result})
+
+
+@vision.route('/merge', methods=["POST"])
+def vision_merge():
+    """Handle POST /vision/merge.
+
+    Builds a ``Stitcher`` from the ``image_list`` field of the JSON request
+    body and calls ``image_merge`` with the ``name`` field and the optional
+    ``without_padding`` field (``None`` when absent). The result is returned
+    as ``{"code": 0, "data": <result>}``.
+    """
+    stitcher = Stitcher(request.json['image_list'])
+    payload = request.json
+    merged = stitcher.image_merge(
+        payload['name'],
+        without_padding=payload.get('without_padding'),
+    )
+    return jsonify({"code": 0, "data": merged})
+
+
+@vision.route('/similar', methods=["POST"])
+def vision_similar():
+    """Handle POST /vision/similar.
+
+    Passes the ``image1`` and ``image2`` fields of the JSON request body to
+    ``HashSimilar().get_hash_similar`` and returns the result as
+    ``{"code": 0, "data": <result>}``.
+    """
+    compare = HashSimilar().get_hash_similar
+    payload = request.json
+    similarity = compare(payload['image1'], payload['image2'])
+    return jsonify({"code": 0, "data": similarity})
+
+
+@vision.route('/pop', methods=["POST"])
+def vision_pop():
+    """Handle POST /vision/pop.
+
+    Passes the ``image`` field of the JSON request body to ``get_pop_v`` and
+    returns the result as ``{"code": 0, "data": <result>}``.
+    """
+    pop_result = get_pop_v(request.json['image'])
+    return jsonify({"code": 0, "data": pop_result})
+
+
+@vision.route('/text', methods=["POST"])
+def vision_text():
+    """Handle POST /vision/text.
+
+    Passes the ``image`` field of the JSON request body to ``get_image_text``
+    and returns ``{"code": 0, "data": <result>}``. The Content-Type header is
+    set explicitly so the response declares a UTF-8 charset.
+    """
+    payload = {"code": 0, "data": get_image_text(request.json['image'])}
+    response = make_response(jsonify(payload))
+    response.headers["Content-Type"] = "application/json;charset=utf-8"
+    return response
@@ -0,0 +1,95 @@
+import cv2
+import copy
+import numpy as np
+import dbnet_crnn.tools.utility as utility
+from service.image_utils import get_center_pos
+import dbnet_crnn.tools.predict_det as predict_det
+import dbnet_crnn.tools.predict_rec as predict_rec
+
+
+def sorted_boxes(dt_boxes, row_tolerance=10):
+    """
+    Sort text boxes in reading order: top to bottom, then left to right.
+
+    Boxes are first ordered by the (y, x) of their first point. Boxes on one
+    visual line rarely share exactly the same y, so each box is then moved
+    left past every preceding neighbour whose first-point y is within
+    ``row_tolerance`` and whose first-point x is larger.
+    args:
+        dt_boxes(array): detected text boxes; each box is indexed as
+            box[0][0] (x) and box[0][1] (y) of its first point
+            (presumably shape [N, 4, 2] -- confirm against the detector)
+        row_tolerance(number): first-point y difference below which two
+            boxes are treated as lying on the same line
+    return:
+        list of boxes in sorted order (empty list for empty input)
+    """
+    boxes = sorted(dt_boxes, key=lambda box: (box[0][1], box[0][0]))
+
+    # A single adjacent-swap pass leaves a line of three or more boxes only
+    # partially ordered, so bubble each box back as far as it needs to go.
+    for i in range(len(boxes) - 1):
+        for j in range(i, -1, -1):
+            same_row = abs(boxes[j + 1][0][1] - boxes[j][0][1]) < row_tolerance
+            if same_row and boxes[j + 1][0][0] < boxes[j][0][0]:
+                boxes[j], boxes[j + 1] = boxes[j + 1], boxes[j]
+            else:
+                break
+    return boxes
+
+
+class ImageText(object):
+    """Text detection and recognition pipeline using the bundled modelv1.1 files."""
+
+    def __init__(self):
+        """Build the detector and recognizer from ``utility.parse_args()``.
+
+        The model directories are relative paths, so they resolve against the
+        working directory of the running process.
+        """
+        args = utility.parse_args()
+        self.text_detector = predict_det.TextDetector(args, model_path='dbnet_crnn/modelv1.1/det/')
+        self.text_recognizer = predict_rec.TextRecognizer(args, model_path='dbnet_crnn/modelv1.1/rec/')
+
+    def get_rotate_crop_image(self, img, points):
+        """Warp the quadrilateral ``points`` out of ``img`` into an upright rectangle.
+
+        args:
+            img: source image handed to ``cv2.warpPerspective``
+            points: four corner points of the text box; points[0..3] are
+                mapped to the top-left, top-right, bottom-right and
+                bottom-left corners of the output (assumed to be a float32
+                array as ``cv2.getPerspectiveTransform`` expects -- confirm
+                against the detector output)
+        return:
+            the cropped image, rotated with ``np.rot90`` when its
+            height/width ratio is at least 1.5
+        """
+        # Output size: the longer of each pair of opposite edges.
+        crop_width = int(max(np.linalg.norm(points[0] - points[1]),
+                             np.linalg.norm(points[2] - points[3])))
+        crop_height = int(max(np.linalg.norm(points[0] - points[3]),
+                              np.linalg.norm(points[1] - points[2])))
+        pts_std = np.float32([[0, 0], [crop_width, 0],
+                              [crop_width, crop_height],
+                              [0, crop_height]])
+        transform = cv2.getPerspectiveTransform(points, pts_std)
+        dst_img = cv2.warpPerspective(img, transform, (crop_width, crop_height),
+                                      borderMode=cv2.BORDER_REPLICATE,
+                                      flags=cv2.INTER_CUBIC)
+        dst_img_height, dst_img_width = dst_img.shape[0:2]
+        if dst_img_height * 1.0 / dst_img_width >= 1.5:
+            dst_img = np.rot90(dst_img)
+        return dst_img
+
+    def get_ocr(self, img, max_side_len):
+        """Detect text boxes in ``img`` and run recognition on each crop.
+
+        return:
+            (boxes, rec_res): the boxes in the order produced by
+            ``sorted_boxes`` and the recognizer output for the matching
+            crops, or (None, None) when the detector returns None
+        """
+        # Copy before detection so crops come from an image the detector call
+        # cannot have modified.
+        ori_im = img.copy()
+        dt_boxes = self.text_detector(img, max_side_len)
+        if dt_boxes is None:
+            return None, None
+        dt_boxes = sorted_boxes(dt_boxes)
+        # Each box is deep-copied so the crop helper never touches the boxes
+        # that are returned to the caller.
+        img_crop_list = [
+            self.get_rotate_crop_image(ori_im, copy.deepcopy(box))
+            for box in dt_boxes
+        ]
+        rec_res = self.text_recognizer(img_crop_list)
+        return dt_boxes, rec_res
+
+    def get_text(self, img, max_side_len, score_thresh=0.6):
+        """Return recognized text entries whose score exceeds ``score_thresh``.
+
+        return:
+            list of dicts with keys ``pos`` (``get_center_pos`` of the box),
+            ``text`` and ``score`` (rounded to two decimals); an empty list
+            when ``get_ocr`` reports no detection
+        """
+        dt_boxes, rec_res = self.get_ocr(img, max_side_len)
+        if dt_boxes is None or rec_res is None:
+            # get_ocr signals "nothing detected" with (None, None); zipping
+            # those would raise TypeError.
+            return []
+        result = []
+        for box, rec in zip(dt_boxes, rec_res):
+            text, score = rec[0], rec[1]
+            if score > score_thresh:
+                result.append({
+                    'pos': get_center_pos(box),
+                    'text': text,
+                    'score': round(float(score), 2)
+                })
+        return result
+
+
+# Shared instance created at import time; ImageText.__init__ constructs the
+# detector and recognizer, so importing this module builds both.
+image_text = ImageText()
-Original file line number
+Diff line change
@@ @@ -0,0 +1,5 @@ @@
 +*.pyc
 +.DS_Store
 +.idea/
 +capture/local_*/
 +*.so