[Other] Refactor js submodule (#415)

* Refactor js submodule

* Remove change-log

* Update ocr module

* Update ocr-detection module

* Update ocr-detection module

* Remove change-log
This commit is contained in:
chenqianhe
2022-10-23 14:05:13 +08:00
committed by GitHub
parent 30971cf3fd
commit f2619b0546
273 changed files with 14697 additions and 5088 deletions

View File

@@ -0,0 +1,216 @@
import clipper from 'js-clipper';
import { divide, enableBoundaryChecking, plus } from 'number-precision';
import CV from '@paddlejs-mediapipe/opencv/library/opencv_ocr';
import * as d3Polygon from 'd3-polygon';
import { BOX, POINT, POINTS } from "./type";
/**
 * Post-processing for a DB (Differentiable Binarization) text-detection map.
 *
 * Takes the per-pixel score map produced by the detection model, binarizes it,
 * extracts contours with OpenCV and turns every sufficiently confident contour
 * into an expanded, ordered four-point text box.
 */
export default class DBPostprocess {
    /** Score above which a pixel is marked as foreground in the binary map. */
    private readonly thresh: number;
    /** Minimum mean score a candidate box needs in order to be kept. */
    private readonly box_thresh: number;
    /** Upper bound on the number of contours examined per call. */
    private readonly max_candidates: number;
    /** Factor controlling how far a box is grown outwards by `unclip`. */
    private readonly unclip_ratio: number;
    /** Minimum short-side length for a candidate rectangle. */
    private readonly min_size: number;
    /** Raw score map, row-major, expected to hold `width * height` values. */
    private readonly pred: number[];
    /** Binarized map (0 or 255 per pixel) derived from `pred`. */
    private readonly segmentation: number[];
    private readonly width: number;
    private readonly height: number;

    /**
     * @param result Row-major score map produced by the detection model.
     * @param shape Map dimensions; `shape[0]` is used as the width and `shape[1]` as the height.
     * @param thresh Binarization threshold; falsy values fall back to 0.3.
     * @param box_thresh Minimum mean box score; falsy values fall back to 0.6.
     * @param unclip_ratio Box expansion ratio; falsy values fall back to 1.5.
     */
    constructor(result: number[], shape: number[], thresh = 0.3, box_thresh = 0.6, unclip_ratio = 1.5) {
        enableBoundaryChecking(false);
        this.thresh = thresh ? thresh : 0.3;
        this.box_thresh = box_thresh ? box_thresh : 0.6;
        this.max_candidates = 1000;
        this.unclip_ratio = unclip_ratio ? unclip_ratio : 1.5;
        this.min_size = 3;
        this.width = shape[0];
        this.height = shape[1];
        this.pred = result;
        this.segmentation = result.map((score: number) => (score > this.thresh ? 255 : 0));
    }

    /**
     * Extracts text boxes from the binarized map.
     *
     * @returns The kept boxes (four `[x, y]` points each, clipped to the map
     * size) and the mean score of each box, in matching order.
     */
    public outputBox(): { boxes: BOX; scores: number[] } {
        // The Mat is sized from the shape handed to the constructor instead of a fixed 960.
        // eslint-disable-next-line new-cap
        const src = new CV.matFromArray(this.height, this.width, CV.CV_8UC1, this.segmentation);
        const contours = new CV.MatVector();
        const hierarchy = new CV.Mat();
        const boxes: BOX = [];
        const scores: number[] = [];
        try {
            // Find the contours of the foreground regions.
            CV.findContours(src, contours, hierarchy, CV.RETR_LIST, CV.CHAIN_APPROX_SIMPLE);
            const num_contours = Math.min(contours.size(), this.max_candidates);
            for (let i = 0; i < num_contours; i++) {
                const contour = contours.get(i);
                let minBox: { points: POINTS; side: number };
                try {
                    minBox = this.get_mini_boxes(contour);
                }
                finally {
                    // Every Mat handed out by MatVector.get must be released explicitly.
                    contour.delete();
                }
                if (minBox.side < this.min_size) {
                    continue;
                }
                const score = this.box_score_fast(this.pred, minBox.points);
                if (this.box_thresh > score) {
                    continue;
                }
                const expanded = this.unclip(minBox.points);
                if (expanded.length === 0) {
                    // The offset produced no polygon, so there is nothing to fit a rectangle to.
                    continue;
                }
                // eslint-disable-next-line new-cap
                const boxMap = new CV.matFromArray(expanded.length / 2, 1, CV.CV_32SC2, expanded);
                let resultObj: { points: POINTS; side: number };
                try {
                    resultObj = this.get_mini_boxes(boxMap);
                }
                finally {
                    // Released here so the early `continue` below cannot leak it.
                    boxMap.delete();
                }
                if (resultObj.side < this.min_size + 2) {
                    continue;
                }
                const box: POINTS = resultObj.points.map((item): POINT => [
                    this.clip(Math.round(item[0]), 0, this.width),
                    this.clip(Math.round(item[1]), 0, this.height)
                ]);
                boxes.push(box);
                scores.push(score);
            }
        }
        finally {
            src.delete();
            contours.delete();
            hierarchy.delete();
        }
        return { boxes, scores };
    }

    /**
     * Fits the minimum-area rectangle around a contour.
     *
     * @param contour OpenCV Mat holding the contour points.
     * @returns The four corners ordered top-left, top-right, bottom-right,
     * bottom-left (image coordinates, y growing downwards) and the length of
     * the rectangle's shorter side.
     */
    private get_mini_boxes(contour): { points: POINTS; side: number } {
        // Minimum-area bounding rectangle of the contour.
        const bounding_box = CV.minAreaRect(contour);
        const points: POINTS = [];
        const mat = new CV.Mat();
        try {
            // Read the rectangle's four corner coordinates.
            CV.boxPoints(bounding_box, mat);
            for (let i = 0; i < mat.data32F.length; i += 2) {
                points.push([mat.data32F[i], mat.data32F[i + 1]]);
            }
        }
        finally {
            mat.delete();
        }
        // After sorting by x, the first two points form the left edge and the last two the right edge.
        points.sort((a: POINT, b: POINT) => a[0] - b[0]);
        const [topLeft, bottomLeft] = points[1][1] > points[0][1]
            ? [points[0], points[1]]
            : [points[1], points[0]];
        const [topRight, bottomRight] = points[3][1] > points[2][1]
            ? [points[2], points[3]]
            : [points[3], points[2]];
        const side = Math.min(bounding_box.size.height, bounding_box.size.width);
        return { points: [topLeft, topRight, bottomRight, bottomLeft], side };
    }

    /**
     * Mean score of the map pixels that lie inside a polygon.
     *
     * @param bitmap Row-major score map with `this.width` values per row.
     * @param _box Polygon vertices in map coordinates; not modified.
     * @returns The mean of the covered scores, or 0 when no pixel is covered.
     */
    private box_score_fast(bitmap: number[], _box: POINTS): number {
        const h = this.height;
        const w = this.width;
        const xs = _box.map((item: POINT) => item[0]);
        const ys = _box.map((item: POINT) => item[1]);
        // Axis-aligned bounds of the polygon, limited to valid pixel indices.
        const xmin = this.clip(Math.floor(Math.min(...xs)), 0, w - 1);
        const xmax = this.clip(Math.ceil(Math.max(...xs)), 0, w - 1);
        const ymin = this.clip(Math.floor(Math.min(...ys)), 0, h - 1);
        const ymax = this.clip(Math.ceil(Math.max(...ys)), 0, h - 1);
        // Vertices relative to the top-left corner of the bounds.
        const local = _box.map((item: POINT) => [
            Math.max(item[0] - xmin, 0),
            Math.max(item[1] - ymin, 0)
        ]);
        // Int32Array matches the CV_32SC2 element type; an 8-bit array would wrap
        // every coordinate above 255 and distort the mask of large boxes.
        const point_data = Int32Array.from(local.flat());
        // eslint-disable-next-line new-cap
        const mask = new CV.Mat.zeros(ymax - ymin + 1, xmax - xmin + 1, CV.CV_8UC1);
        const points = CV.matFromArray(local.length, 1, CV.CV_32SC2, point_data);
        const pts = new CV.MatVector();
        try {
            pts.push_back(points);
            // Rasterize the polygon into the mask.
            CV.fillPoly(mask, pts, new CV.Scalar(255), 1);
            // Copy the matching window of the score map, row by row.
            const region: number[] = [];
            for (let row = ymin; row <= ymax; row++) {
                const start = w * row;
                region.push(...bitmap.slice(start + xmin, start + xmax + 1));
            }
            return this.mean(region, mask.data);
        }
        finally {
            mask.delete();
            points.delete();
            pts.delete();
        }
    }

    /** Limits `data` to the closed range [`min`, `max`]. */
    private clip(data: number, min: number, max: number): number {
        return data < min ? min : data > max ? max : data;
    }

    /**
     * Grows a polygon outwards by `area * unclip_ratio / perimeter`.
     *
     * @param box Polygon vertices.
     * @returns The first expanded polygon as a flat `[x0, y0, x1, y1, ...]`
     * list, or an empty list when the offset yields no polygon.
     */
    private unclip(box: POINTS): number[] {
        const area = Math.abs(d3Polygon.polygonArea(box));
        const length = d3Polygon.polygonLength(box);
        const distance = area * this.unclip_ratio / length;
        const path = box.map((item: POINT) => ({ X: item[0], Y: item[1] }));
        const offset = new clipper.ClipperOffset();
        offset.AddPath(path, clipper.JoinType.jtRound, clipper.EndType.etClosedPolygon);
        const expanded: { X: number; Y: number; }[][] = [];
        offset.Execute(expanded, distance);
        const flattened: number[] = [];
        if (expanded[0]) {
            for (const vertex of expanded[0]) {
                flattened.push(vertex.X, vertex.Y);
            }
        }
        return flattened;
    }

    /**
     * Mean of the `data` entries whose `mask` entry is non-zero.
     *
     * @returns The masked mean, or 0 when the mask selects nothing (avoids a
     * NaN score that would slip past the `box_thresh` comparison).
     */
    private mean(data: ArrayLike<number>, mask: ArrayLike<number>): number {
        let sum = 0;
        let count = 0;
        for (let i = 0; i < data.length; i++) {
            if (mask[i]) {
                sum = plus(sum, data[i]);
                count++;
            }
        }
        return count === 0 ? 0 : divide(sum, count);
    }
}

View File

@@ -0,0 +1,102 @@
/**
* @file ocr_det model
*/
import { Runner } from '@paddlejs/paddlejs-core';
import '@paddlejs/paddlejs-backend-webgl';
import DBProcess from './dbPostprocess';
/** Side length of the square detection input used when the config gives no shape. */
const DEFAULTDETSHAPE = 960;

/** Working canvas onto which every input image is drawn before inference. */
const canvas: HTMLCanvasElement = document.createElement('canvas');

/** Shared model runner; holds null until `load` assigns it. */
let detectRunner: Runner = null as Runner;

/** Options controlling detection input size and box post-processing. */
export interface DetPostConfig {
    /** Side length of the square canvas the image is drawn onto. */
    shape: number;
    /** Threshold forwarded to the post-processor for binarizing the score map. */
    thresh: number;
    /** Minimum mean score forwarded to the post-processor for keeping a box. */
    box_thresh: number;
    /** Expansion ratio forwarded to the post-processor for growing each box. */
    unclip_ratio: number;
}

/** Configuration used by `detect` when the caller passes none. */
const defaultPostConfig: DetPostConfig = {
    shape: 960,
    thresh: 0.3,
    box_thresh: 0.6,
    unclip_ratio: 1.5
};
// The canvas is used to resize the uploaded source image to the target size.
initCanvas(canvas);

/**
 * Pins the canvas to the top-left corner of the page, makes it invisible and
 * attaches it to the document body.
 *
 * @param canvas Canvas element to style and attach.
 */
function initCanvas(canvas) {
    Object.assign(canvas.style, {
        position: 'absolute',
        top: '0',
        left: '0',
        zIndex: '-1',
        opacity: '0'
    });
    document.body.appendChild(canvas);
}
/** Model location used when `load` is called without a path. */
const defaultModelPath = 'https://js-models.bj.bcebos.com/PaddleOCR/PP-OCRv3/ch_PP-OCRv3_det_infer_js_960/model.json';

/**
 * Creates the shared detection runner and initializes it.
 *
 * @param detPath Model URL; an empty string selects the default model.
 */
export async function load(detPath = '') {
    const modelPath = detPath || defaultModelPath;
    const runnerOptions = {
        modelPath,
        fill: '#fff',
        mean: [0.485, 0.456, 0.406],
        std: [0.229, 0.224, 0.225],
        bgr: true
    };
    detectRunner = new Runner(runnerOptions);
    await detectRunner.init();
}
/**
 * Detects text boxes in an image.
 *
 * The image is letterboxed (aspect ratio kept, centered, white padding) onto a
 * square canvas, run through the detection model, and the resulting boxes are
 * mapped back to coordinates of the original image.
 *
 * @param image Image to analyze; its `naturalWidth` / `naturalHeight` are read.
 * @param Config Detection options; defaults to `defaultPostConfig`.
 * @returns One entry per detected box, each a list of `[x, y]` points clipped
 * to the original image bounds.
 * @throws Error when `load()` has not been called or no 2D context is available.
 */
export async function detect(image, Config:DetPostConfig = defaultPostConfig) {
    if (!detectRunner) {
        throw new Error('Detection model is not loaded; call load() before detect().');
    }
    // Target size.
    const DETSHAPE = Config.shape ? Config.shape : DEFAULTDETSHAPE;
    const thresh = Config.thresh;
    const box_thresh = Config.box_thresh;
    const unclip_ratio = Config.unclip_ratio;
    const targetWidth = DETSHAPE;
    const targetHeight = DETSHAPE;
    canvas.width = targetWidth;
    canvas.height = targetHeight;
    const ctx = canvas.getContext('2d');
    if (!ctx) {
        throw new Error('Unable to acquire a 2D canvas context.');
    }
    ctx.fillStyle = '#fff';
    // fillRect takes (x, y, width, height).
    ctx.fillRect(0, 0, targetWidth, targetHeight);
    // Width and height of the image after scaling.
    let sw = targetWidth;
    let sh = targetHeight;
    let x = 0;
    let y = 0;
    // Target is relatively wider than the image: fit the image to the target height.
    if (targetWidth / targetHeight * image.naturalHeight / image.naturalWidth >= 1) {
        sw = Math.round(sh * image.naturalWidth / image.naturalHeight);
        x = Math.floor((targetWidth - sw) / 2);
    }
    // Target is relatively narrower than the image: fit the image to the target width.
    else {
        sh = Math.round(sw * image.naturalHeight / image.naturalWidth);
        y = Math.floor((targetHeight - sh) / 2);
    }
    ctx.drawImage(image, x, y, sw, sh);
    const shapeList = [DETSHAPE, DETSHAPE];
    const outsDict = await detectRunner.predict(canvas);
    const postResult = new DBProcess(outsDict, shapeList, thresh, box_thresh, unclip_ratio);
    // Boxes in canvas coordinates.
    const result = postResult.outputBox();
    // The longer image side spans the full canvas side, which fixes the scale factor.
    const longestSide = Math.max(image.naturalWidth, image.naturalHeight);
    // Convert to original-image coordinates, keeping every point inside the image.
    const points = result.boxes.map(box => box.map((point): [number, number] => [
        clip(Math.round(point[0] - x) * longestSide / DETSHAPE, 0, image.naturalWidth),
        clip(Math.round(point[1] - y) * longestSide / DETSHAPE, 0, image.naturalHeight)
    ]));
    return points;
}
/**
 * Limits a value to a range.
 *
 * @param data Value to limit.
 * @param min Value returned when `data` is below it.
 * @param max Value returned when `data` is above it (and not below `min`).
 * @returns `min`, `max`, or `data` itself when it lies within the range.
 */
function clip(data: number, min: number, max: number) {
    if (data < min) {
        return min;
    }
    if (data > max) {
        return max;
    }
    return data;
}

View File

@@ -0,0 +1,3 @@
/** A single 2-D coordinate stored as a two-number tuple (used as `[x, y]` by the post-processor). */
export type POINT = [number, number];
/** An ordered list of points, e.g. the corners of one box. */
export type POINTS = POINT[];
/** A list of point lists, e.g. all boxes found in one image. */
export type BOX = POINTS[];