Initial commit

commit b0e71d0ebb (2025-03-06 14:38:32 +08:00)
46 changed files with 1926 additions and 0 deletions

@@ -0,0 +1 @@
export * from "./session";

@@ -0,0 +1,28 @@
export interface SessionNodeInfo {
name: string
type: number
shape: number[]
}
export type SessionNodeType = "float32" | "float64" | "float" | "double" | "int32" | "uint32" | "int16" | "uint16" | "int8" | "uint8" | "int64" | "uint64"
export type SessionNodeData = Float32Array | Float64Array | Int32Array | Uint32Array | Int16Array | Uint16Array | Int8Array | Uint8Array | BigInt64Array | BigUint64Array
export interface SessionRunInputOption {
type?: SessionNodeType
data: SessionNodeData
shape?: number[]
}
export abstract class CommonSession {
public abstract run(inputs: Record<string, SessionNodeData | SessionRunInputOption>): Promise<Record<string, Float32Array>>
public abstract get inputs(): Record<string, SessionNodeInfo>;
public abstract get outputs(): Record<string, SessionNodeInfo>;
}
export function isTypedArray(val: any): val is SessionNodeData {
return ArrayBuffer.isView(val) && !(val instanceof DataView); // also covers views over SharedArrayBuffer
}
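As OrtSession.run below shows, run() accepts either a bare typed array (wrapped internally as { data }) or a full SessionRunInputOption per input. A minimal usage sketch, assuming `session` is a concrete CommonSession and the model has a single input named "input" (both names are hypothetical):

const data = new Float32Array(1 * 3 * 224 * 224);
await session.run({ input: data }); // bare typed array; dtype and shape inferred by the backend
await session.run({ input: { type: "float32", data, shape: [1, 3, 224, 224] } }); // explicit option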

src/backend/index.ts
@@ -0,0 +1 @@
export * as backend from "./main";

src/backend/main.ts
@@ -0,0 +1,2 @@
export * as common from "./common";
export * as ort from "./ort";

src/backend/ort/index.ts
@@ -0,0 +1 @@
export { OrtSession as Session } from "./session";

@@ -0,0 +1,32 @@
import { CommonSession, isTypedArray, SessionNodeData, SessionNodeInfo, SessionRunInputOption } from "../common";
export class OrtSession extends CommonSession {
#session: any;
#inputs: Record<string, SessionNodeInfo> | null = null;
#outputs: Record<string, SessionNodeInfo> | null = null;
public constructor(modelData: Uint8Array) {
super();
const addon = require("../../../build/ort.node")
this.#session = new addon.OrtSession(modelData);
}
public get inputs(): Record<string, SessionNodeInfo> { return this.#inputs ??= this.#session.GetInputsInfo(); }
public get outputs(): Record<string, SessionNodeInfo> { return this.#outputs ??= this.#session.GetOutputsInfo(); }
public run(inputs: Record<string, SessionNodeData | SessionRunInputOption>) {
const inputArgs: Record<string, any> = {};
for (const [name, option] of Object.entries(inputs)) {
if (isTypedArray(option)) inputArgs[name] = { data: option }
else inputArgs[name] = option;
}
return new Promise<Record<string, Float32Array>>((resolve, reject) => this.#session.Run(inputArgs, (err: any, res: any) => {
if (err) return reject(err);
const result: Record<string, Float32Array> = {};
for (const [name, val] of Object.entries(res)) result[name] = new Float32Array(val as ArrayBuffer);
resolve(result);
}));
}
}
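A hedged usage sketch of the binding (the model path is a placeholder, and build/ort.node must be compiled beforehand):

import { readFileSync } from "fs";
import { Session } from "./index"; // re-export of OrtSession

const session = new Session(readFileSync("models/example.onnx")); // hypothetical path
console.log(session.inputs, session.outputs); // SessionNodeInfo records keyed by tensor name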

src/cv/index.ts
@@ -0,0 +1 @@
export * as cv from "./main";

src/cv/main.ts
@@ -0,0 +1 @@
export { Mat, ImreadModes } from "./mat";

src/cv/mat.ts
@@ -0,0 +1,79 @@
export enum ImreadModes {
IMREAD_UNCHANGED = -1,
IMREAD_GRAYSCALE = 0,
IMREAD_COLOR_BGR = 1,
IMREAD_COLOR = 1,
IMREAD_ANYDEPTH = 2,
IMREAD_ANYCOLOR = 4,
IMREAD_LOAD_GDAL = 8,
IMREAD_REDUCED_GRAYSCALE_2 = 16,
IMREAD_REDUCED_COLOR_2 = 17,
IMREAD_REDUCED_GRAYSCALE_4 = 32,
IMREAD_REDUCED_COLOR_4 = 33,
IMREAD_REDUCED_GRAYSCALE_8 = 64,
IMREAD_REDUCED_COLOR_8 = 65,
IMREAD_IGNORE_ORIENTATION = 128,
IMREAD_COLOR_RGB = 256,
};
interface MatConstructorOption {
mode?: ImreadModes;
}
export class Mat {
#mat: any
public static async load(image: string, option?: MatConstructorOption) {
let buffer: Uint8Array
if (/^https?:\/\//.test(image)) buffer = await fetch(image).then(res => res.arrayBuffer()).then(res => new Uint8Array(res));
else buffer = await import("fs").then(fs => fs.promises.readFile(image));
return new Mat(buffer, option);
}
public constructor(imageData: Uint8Array, option?: MatConstructorOption) {
const addon = require("../../build/cv.node");
if ((imageData as any) instanceof addon.Mat) this.#mat = imageData;
else this.#mat = new addon.Mat(imageData, option);
}
public get empty(): boolean { return this.#mat.IsEmpty() }
public get cols(): number { return this.#mat.GetCols(); }
public get rows(): number { return this.#mat.GetRows(); }
public get width() { return this.cols; }
public get height() { return this.rows; }
public get channels() { return this.#mat.GetChannels(); }
public resize(width: number, height: number) { return new Mat(this.#mat.Resize(width, height)); }
public crop(sx: number, sy: number, sw: number, sh: number) { return new Mat(this.#mat.Crop(sx, sy, sw, sh)); }
public rotate(sx: number, sy: number, angleDeg: number) { return new Mat(this.#mat.Rotate(sx, sy, angleDeg)); }
public get data() { return new Uint8Array(this.#mat.Data()); }
public encode(extname: string) { return new Uint8Array(this.#mat.Encode({ extname })); }
public clone() { return new Mat(this.#mat.Clone()); }
public circle(x: number, y: number, radius: number, options?: {
color?: { r: number, g: number, b: number },
thickness?: number
lineType?: number
}) {
this.#mat.DrawCircle(
x, y, radius,
options?.color?.b ?? 0,
options?.color?.g ?? 0,
options?.color?.r ?? 0,
options?.thickness ?? 1,
options?.lineType ?? 8,
0,
);
}
}
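A short usage sketch of Mat (file names are placeholders):

const mat = await Mat.load("photo.jpg", { mode: ImreadModes.IMREAD_COLOR_BGR });
const thumb = mat.resize(128, 128); // returns a new Mat
const face = mat.crop(10, 10, 64, 64); // (sx, sy, sw, sh)
await import("fs").then(fs => fs.promises.writeFile("thumb.jpg", thumb.encode(".jpg")));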

@@ -0,0 +1,37 @@
import { backend } from "../../backend";
import { cv } from "../../cv";
export type ModelConstructor<T> = new (session: backend.common.CommonSession) => T;
export type ImageSource = cv.Mat | Uint8Array | string;
export interface ImageCropOption {
/** 图片裁剪区域 */
crop?: { sx: number, sy: number, sw: number, sh: number }
}
export abstract class Model {
protected session: backend.common.CommonSession;
protected static async resolveImage<R>(image: ImageSource, resolver: (image: cv.Mat) => R | Promise<R>): Promise<R> {
if (typeof image === "string") {
if (/^https?:\/\//.test(image)) image = await fetch(image).then(res => res.arrayBuffer()).then(buffer => new Uint8Array(buffer));
else image = await import("fs").then(fs => fs.promises.readFile(image as string));
}
if (image instanceof Uint8Array) image = new cv.Mat(image, { mode: cv.ImreadModes.IMREAD_COLOR_BGR })
if (image instanceof cv.Mat) return await resolver(image);
else throw new Error("Invalid image");
}
public static fromOnnx<T extends Model>(this: ModelConstructor<T>, modelData: Uint8Array) {
return new this(new backend.ort.Session(modelData));
}
public constructor(session: backend.common.CommonSession) { this.session = session; }
public get inputs() { return this.session.inputs; }
public get outputs() { return this.session.outputs; }
public get input() { return Object.entries(this.inputs)[0][1]; }
public get output() { return Object.entries(this.outputs)[0][1]; }
}
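fromOnnx is typed through ModelConstructor and the polymorphic this parameter, so every subclass gets a correctly typed factory for free. A minimal sketch of a custom subclass (the preprocessing choices are illustrative, not from the source; convertImage comes from the processors module below):

class MyModel extends Model {
  public predict(image: ImageSource) {
    return Model.resolveImage(image, im => this.doPredict(im));
  }
  private async doPredict(image: cv.Mat) {
    const input = this.input; // first declared input
    const resized = image.resize(input.shape[3], input.shape[2]);
    const data = convertImage(resized.data, { sourceImageFormat: "bgr" });
    return this.session.run({ [input.name]: { type: "float32", data, shape: input.shape } });
  }
}
// const model = MyModel.fromOnnx(fs.readFileSync("model.onnx")); // typed as MyModel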

@@ -0,0 +1,84 @@
interface IConvertImageOption {
sourceImageFormat: "rgba" | "rgb" | "bgr"
targetShapeFormat?: "nchw" | "nhwc"
targetColorFormat?: "rgb" | "bgr" | "gray"
targetNormalize?: { mean: number[], std: number[] }
}
export function convertImage(image: Uint8Array, option?: IConvertImageOption) {
const sourceImageFormat = option?.sourceImageFormat ?? "rgb";
const targetShapeFormat = option?.targetShapeFormat ?? "nchw";
const targetColorFormat = option?.targetColorFormat ?? "bgr";
const targetNormalize = option?.targetNormalize ?? { mean: [127.5], std: [127.5] };
let rgbReader: (pixel: number) => [number, number, number];
let pixelCount: number;
switch (sourceImageFormat) {
case "bgr":
rgbReader = pixel => [image[pixel * 3 + 2], image[pixel * 3 + 1], image[pixel * 3 + 0]];
pixelCount = image.length / 3;
break;
case "rgb":
rgbReader = pixel => [image[pixel * 3 + 0], image[pixel * 3 + 1], image[pixel * 3 + 2]];
pixelCount = image.length / 3;
break;
case "rgba":
rgbReader = pixel => [image[pixel * 4 + 0], image[pixel * 4 + 1], image[pixel * 4 + 2]];
pixelCount = image.length / 4;
break;
}
let targetChannelGetter: (stride: number, pixel: number, offset: number) => number;
switch (targetShapeFormat) {
case "nchw":
targetChannelGetter = (stride, pixel, offset) => stride * offset + pixel;
break;
case "nhwc":
targetChannelGetter = (stride, pixel, offset) => stride * pixel + offset;
break
}
let normIndex = 0;
const normValue = (val: number) => {
const mean = targetNormalize.mean[normIndex % targetNormalize.mean.length];
const std = targetNormalize.std[normIndex % targetNormalize.std.length];
const result = (val - mean) / std;
++normIndex;
return result;
}
let outBuffer: Float32Array;
let pixelWriter: (pixel: number, r: number, g: number, b: number) => any
switch (targetColorFormat) {
case "rgb":
outBuffer = new Float32Array(pixelCount * 3);
pixelWriter = (pixel, r, g, b) => {
outBuffer[targetChannelGetter(3, pixel, 0)] = normValue(r);
outBuffer[targetChannelGetter(3, pixel, 1)] = normValue(g);
outBuffer[targetChannelGetter(3, pixel, 2)] = normValue(b);
}
break;
case "bgr":
outBuffer = new Float32Array(pixelCount * 3);
pixelWriter = (pixel, r, g, b) => {
outBuffer[targetChannelGetter(3, pixel, 0)] = normValue(b);
outBuffer[targetChannelGetter(3, pixel, 1)] = normValue(g);
outBuffer[targetChannelGetter(3, pixel, 2)] = normValue(r);
}
break;
case "gray":
outBuffer = new Float32Array(pixelCount);
pixelWriter = (pixel, r, g, b) => {
outBuffer[targetChannelGetter(1, pixel, 0)] = normValue(0.2126 * r + 0.7152 * g + 0.0722 * b);
}
break;
}
for (let i = 0; i < pixelCount; ++i) {
const [r, g, b] = rgbReader(i);
pixelWriter(i, r, g, b);
}
return outBuffer;
}
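A worked example on a single red RGBA pixel with the defaults (nchw, bgr, mean/std 127.5): red 255 maps to (255 - 127.5) / 127.5 = 1 and lands in the last plane because the target order is BGR:

const pixel = new Uint8Array([255, 0, 0, 255]); // one RGBA pixel, pure red
const out = convertImage(pixel, { sourceImageFormat: "rgba" });
// out is Float32Array [-1, -1, 1] (the B, G, R planes of a one-pixel NCHW tensor)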

@@ -0,0 +1,58 @@
export interface FacePoint {
x: number
y: number
}
type PointType = "leftEye" | "rightEye" | "leftEyebrow" | "rightEyebrow" | "nose" | "mouth" | "contour"
export abstract class FaceAlignmentResult {
#points: FacePoint[]
public constructor(points: FacePoint[]) { this.#points = points; }
/** Landmark points */
public get points() { return this.#points; }
/** Get the landmarks of a specific type */
public getPointsOf(type: PointType | PointType[]) {
if (typeof type == "string") type = [type];
const result: FacePoint[] = [];
for (const t of type) {
for (const idx of this[`${t}PointIndex` as const]()) {
result.push(this.points[idx]);
}
}
return result;
}
/** Face direction in radians */
public get direction() {
const [{ x: x1, y: y1 }, { x: x2, y: y2 }] = this.directionPointIndex().map(idx => this.points[idx]);
return Math.atan2(y1 - y2, x2 - x1);
}
/** Indexes of the two points used to estimate direction (eye-center points recommended) */
protected abstract directionPointIndex(): [number, number];
/** Indexes of the left-eye points */
protected abstract leftEyePointIndex(): number[];
/** Indexes of the right-eye points */
protected abstract rightEyePointIndex(): number[];
/** Indexes of the left-eyebrow points */
protected abstract leftEyebrowPointIndex(): number[];
/** Indexes of the right-eyebrow points */
protected abstract rightEyebrowPointIndex(): number[];
/** Indexes of the mouth points */
protected abstract mouthPointIndex(): number[];
/** Indexes of the nose points */
protected abstract nosePointIndex(): number[];
/** Indexes of the contour points */
protected abstract contourPointIndex(): number[];
protected indexFromTo(from: number, to: number) {
const indexes: number[] = [];
for (let i = from; i <= to; i++) {
indexes.push(i);
}
return indexes;
}
}

@@ -0,0 +1,2 @@
export { PFLD } from "./pfld";
export { FaceLandmark1000 } from "./landmark1000";

@@ -0,0 +1,52 @@
import { cv } from "../../cv";
import { ImageCropOption, ImageSource, Model } from "../common/model";
import { convertImage } from "../common/processors";
import { FaceAlignmentResult, FacePoint } from "./common";
interface FaceLandmark1000PredictOption extends ImageCropOption { }
class FaceLandmark1000Result extends FaceAlignmentResult {
protected directionPointIndex(): [number, number] { return [401, 529]; }
protected leftEyePointIndex(): number[] { return this.indexFromTo(401, 528); }
protected rightEyePointIndex(): number[] { return this.indexFromTo(529, 656); }
protected leftEyebrowPointIndex(): number[] { return this.indexFromTo(273, 336); }
protected rightEyebrowPointIndex(): number[] { return this.indexFromTo(337, 400); }
protected mouthPointIndex(): number[] { return this.indexFromTo(845, 972); }
protected nosePointIndex(): number[] { return this.indexFromTo(657, 844); }
protected contourPointIndex(): number[] { return this.indexFromTo(0, 272); }
}
export class FaceLandmark1000 extends Model {
public predict(image: ImageSource, option?: FaceLandmark1000PredictOption) { return Model.resolveImage(image, im => this.doPredict(im, option)); }
public async doPredict(image: cv.Mat, option?: FaceLandmark1000PredictOption) {
const input = this.input;
if (option?.crop) image = image.crop(option.crop.sx, option.crop.sy, option.crop.sw, option.crop.sh);
const ratioWidth = image.width / input.shape[3];
const ratioHeight = image.height / input.shape[2];
image = image.resize(input.shape[3], input.shape[2]);
const nchwImageData = convertImage(image.data, { sourceImageFormat: "bgr", targetColorFormat: "gray", targetShapeFormat: "nchw", targetNormalize: { mean: [0], std: [1] } });
const res = await this.session.run({
[input.name]: {
shape: [1, 1, input.shape[2], input.shape[3]],
data: nchwImageData,
type: "float32",
}
}).then(res => res[this.output.name]);
const points: FacePoint[] = [];
for (let i = 0; i < res.length; i += 2) {
const x = res[i] * image.width * ratioWidth;
const y = res[i + 1] * image.height * ratioHeight;
points.push({ x, y });
}
return new FaceLandmark1000Result(points);
}
}

@@ -0,0 +1,53 @@
import { cv } from "../../cv";
import { ImageCropOption, ImageSource, Model } from "../common/model";
import { convertImage } from "../common/processors";
import { FaceAlignmentResult, FacePoint } from "./common";
export interface PFLDPredictOption extends ImageCropOption { }
class PFLDResult extends FaceAlignmentResult {
protected directionPointIndex(): [number, number] { return [36, 92]; }
protected leftEyePointIndex(): number[] { return [33, 34, 35, 36, 37, 38, 39, 40, 41, 42]; }
protected rightEyePointIndex(): number[] { return [87, 88, 89, 90, 91, 92, 93, 94, 95, 96]; }
protected leftEyebrowPointIndex(): number[] { return [43, 44, 45, 46, 47, 48, 49, 50, 51]; }
protected rightEyebrowPointIndex(): number[] { return [97, 98, 99, 100, 101, 102, 103, 104, 105]; }
protected mouthPointIndex(): number[] { return [52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71]; }
protected nosePointIndex(): number[] { return [72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86]; }
protected contourPointIndex(): number[] { return [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32]; }
}
export class PFLD extends Model {
public predict(image: ImageSource, option?: PFLDPredictOption) { return Model.resolveImage(image, im => this.doPredict(im, option)); }
private async doPredict(image: cv.Mat, option?: PFLDPredictOption) {
const input = this.input;
if (option?.crop) image = image.crop(option.crop.sx, option.crop.sy, option.crop.sw, option.crop.sh);
const ratioWidth = image.width / input.shape[3];
const ratioHeight = image.height / input.shape[2];
image = image.resize(input.shape[3], input.shape[2]);
const nchwImageData = convertImage(image.data, { sourceImageFormat: "bgr", targetColorFormat: "bgr", targetShapeFormat: "nchw", targetNormalize: { mean: [0], std: [255] } })
const pointsOutput = Object.entries(this.outputs).filter(([_, out]) => out.shape.length == 2)[0][1];
const res = await this.session.run({
[input.name]: {
type: "float32",
data: nchwImageData,
shape: [1, 3, input.shape[2], input.shape[3]],
}
});
const pointsBuffer = res[pointsOutput.name];
const points: FacePoint[] = [];
for (let i = 0; i < pointsBuffer.length; i += 2) {
const x = pointsBuffer[i] * image.width * ratioWidth;
const y = pointsBuffer[i + 1] * image.height * ratioHeight;
points.push({ x, y });
}
return new PFLDResult(points);
}
}

@@ -0,0 +1,40 @@
import { cv } from "../../cv";
import { ImageCropOption, ImageSource, Model } from "../common/model";
import { convertImage } from "../common/processors";
interface GenderAgePredictOption extends ImageCropOption { }
export interface GenderAgePredictResult {
gender: "M" | "F"
age: number
}
export class GenderAge extends Model {
private async doPredict(image: cv.Mat, option?: GenderAgePredictOption): Promise<GenderAgePredictResult> {
const input = this.input;
const output = this.output;
if (option?.crop) image = image.crop(option.crop.sx, option.crop.sy, option.crop.sw, option.crop.sh);
image = image.resize(input.shape[3], input.shape[2]);
const nchwImage = convertImage(image.data, { sourceImageFormat: "bgr", targetColorFormat: "rgb", targetShapeFormat: "nchw", targetNormalize: { mean: [0], std: [1] } });
const result = await this.session.run({
[input.name]: {
shape: [1, 3, input.shape[2], input.shape[3]],
data: nchwImage,
type: "float32",
}
}).then(res => res[output.name]);
return {
gender: result[0] > result[1] ? "F" : "M",
age: Math.trunc(result[2] * 100),
}
}
public predict(image: ImageSource, option?: GenderAgePredictOption) {
return Model.resolveImage(image, im => this.doPredict(im, option));
}
}

@@ -0,0 +1 @@
export { GenderAge as GenderAgeDetector } from "./gender-age";

@@ -0,0 +1,103 @@
import { cv } from "../../cv"
import { ImageSource, Model } from "../common/model"
interface IFaceBoxConstructorOption {
x1: number
y1: number
x2: number
y2: number
score: number
imw: number
imh: number
}
export class FaceBox {
#option: IFaceBoxConstructorOption;
constructor(option: IFaceBoxConstructorOption) { this.#option = option; }
public get x1() { return this.#option.x1; }
public get y1() { return this.#option.y1; }
public get x2() { return this.#option.x2; }
public get y2() { return this.#option.y2; }
public get centerX() { return this.x1 + this.width / 2; }
public get centerY() { return this.y1 + this.height / 2; }
public get score() { return this.#option.score; }
public get left() { return this.x1; }
public get top() { return this.y1; }
public get width() { return this.x2 - this.x1; }
public get height() { return this.y2 - this.y1; }
/** Truncate the coordinates to integers */
public toInt() {
return new FaceBox({
...this.#option,
x1: Math.trunc(this.#option.x1), y1: Math.trunc(this.#option.y1),
x2: Math.trunc(this.#option.x2), y2: Math.trunc(this.#option.y2),
});
}
/** Convert to a square box, clamped to the image bounds */
public toSquare() {
const { imw, imh } = this.#option;
let size = Math.max(this.width, this.height) / 2;
const cx = this.centerX, cy = this.centerY;
if (cx - size < 0) size = cx;
if (cx + size > imw) size = imw - cx;
if (cy - size < 0) size = cy;
if (cy + size > imh) size = imh - cy;
return new FaceBox({
...this.#option,
x1: this.centerX - size, y1: this.centerY - size,
x2: this.centerX + size, y2: this.centerY + size,
});
}
}
export interface FaceDetectOption {
/** Score threshold, default 0.5 */
threshold?: number
/** NMS threshold, default 0.3 */
nmsThreshold?: number
}
export abstract class FaceDetector extends Model {
protected abstract doPredict(image: cv.Mat, option?: FaceDetectOption): Promise<FaceBox[]>;
public async predict(image: ImageSource, option?: FaceDetectOption) { return Model.resolveImage(image, im => this.doPredict(im, option)); }
}
export function nms(input: FaceBox[], threshold: number) {
if (!input.length) return [];
input = input.sort((a, b) => b.score - a.score);
const merged = input.map(() => 0);
const output: FaceBox[] = [];
for (let i = 0; i < input.length; i++) {
if (merged[i]) continue;
output.push(input[i]);
for (let j = i + 1; j < input.length; j++) {
if (merged[j]) continue;
const inner_x0 = input[i].x1 > input[j].x1 ? input[i].x1 : input[j].x1;
const inner_y0 = input[i].y1 > input[j].y1 ? input[i].y1 : input[j].y1;
const inner_x1 = input[i].x2 < input[j].x2 ? input[i].x2 : input[j].x2;
const inner_y1 = input[i].y2 < input[j].y2 ? input[i].y2 : input[j].y2;
const inner_h = inner_y1 - inner_y0 + 1;
const inner_w = inner_x1 - inner_x0 + 1;
if (inner_h <= 0 || inner_w <= 0) continue;
const inner_area = inner_h * inner_w;
const h1 = input[j].y2 - input[j].y1 + 1;
const w1 = input[j].x2 - input[j].x1 + 1;
const area1 = h1 * w1;
const score = inner_area / area1;
if (score > threshold) merged[j] = 1;
}
}
return output;
}
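Note that the suppression metric is intersection over the candidate's own area rather than IoU, so a box nested inside a higher-scoring box is always suppressed. A quick sketch with hypothetical boxes:

const a = new FaceBox({ x1: 0, y1: 0, x2: 100, y2: 100, score: 0.9, imw: 640, imh: 480 });
const b = new FaceBox({ x1: 10, y1: 10, x2: 60, y2: 60, score: 0.8, imw: 640, imh: 480 });
console.log(nms([a, b], 0.3).length); // 1: b lies inside a, so its overlap ratio is 1 > 0.3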

@@ -0,0 +1,2 @@
export { FaceBox } from "./common";
export { Yolov5Face } from "./yolov5";

@@ -0,0 +1,37 @@
import { cv } from "../../cv";
import { convertImage } from "../common/processors";
import { FaceBox, FaceDetectOption, FaceDetector, nms } from "./common";
export class Yolov5Face extends FaceDetector {
public async doPredict(image: cv.Mat, option?: FaceDetectOption): Promise<FaceBox[]> {
const input = this.input;
const resizedImage = image.resize(input.shape[3], input.shape[2]); // resize takes (width, height); the input shape is [n, c, h, w]
const ratioWidth = image.width / resizedImage.width;
const ratioHeight = image.height / resizedImage.height;
const nchwImageData = convertImage(resizedImage.data, { sourceImageFormat: "bgr", targetColorFormat: "bgr", targetShapeFormat: "nchw", targetNormalize: { mean: [127.5], std: [127.5] } });
const outputData = await this.session.run({ input: nchwImageData }).then(r => r.output);
const outShape = this.outputs["output"].shape;
const faces: FaceBox[] = [];
const threshold = option?.threshold ?? 0.5;
for (let i = 0; i < outShape[1]; i++) {
const beg = i * outShape[2];
const rectData = outputData.slice(beg, beg + outShape[2]);
const x = Math.trunc(rectData[0] * ratioWidth);
const y = Math.trunc(rectData[1] * ratioHeight);
const w = Math.trunc(rectData[2] * ratioWidth);
const h = Math.trunc(rectData[3] * ratioHeight);
const score = rectData[4] * rectData[15];
if (score < threshold) continue;
faces.push(new FaceBox({
x1: x - w / 2, y1: y - h / 2,
x2: x + w / 2, y2: y + h / 2,
score, imw: image.width, imh: image.height,
}))
}
return nms(faces, option?.nmsThreshold ?? 0.3).map(box => box.toInt());
}
}

@@ -0,0 +1,27 @@
import { Mat } from "../../cv/mat";
import { convertImage } from "../common/processors";
import { FaceRecognition, FaceRecognitionPredictOption } from "./common";
export class AdaFace extends FaceRecognition {
public async doPredict(image: Mat, option?: FaceRecognitionPredictOption): Promise<number[]> {
const input = this.input;
const output = this.output;
if (option?.crop) image = image.crop(option.crop.sx, option.crop.sy, option.crop.sw, option.crop.sh);
image = image.resize(input.shape[3], input.shape[2]);
const nchwImageData = convertImage(image.data, { sourceImageFormat: "bgr", targetColorFormat: "rgb", targetShapeFormat: "nchw", targetNormalize: { mean: [127.5], std: [127.5] } });
const embedding = await this.session.run({
[input.name]: {
type: "float32",
data: nchwImageData,
shape: [1, 3, input.shape[2], input.shape[3]],
}
}).then(res => res[output.name]);
return Array.from(embedding);
}
}

@@ -0,0 +1,31 @@
import { cv } from "../../cv";
import { ImageCropOption, ImageSource, Model } from "../common/model";
export interface FaceRecognitionPredictOption extends ImageCropOption { }
export abstract class FaceRecognition extends Model {
public abstract doPredict(image: cv.Mat, option?: FaceRecognitionPredictOption): Promise<number[]>;
public async predict(image: ImageSource, option?: FaceRecognitionPredictOption) { return Model.resolveImage(image, im => this.doPredict(im, option)); }
}
export function cosineDistance(lhs: number[], rhs: number[]) {
if (lhs.length !== rhs.length) throw new Error("embedding lengths do not match");
const getMod = (vec: number[]) => {
let sum = 0;
for (let i = 0; i < vec.length; ++i) sum += vec[i] * vec[i];
return sum ** 0.5;
}
let temp = 0;
for (let i = 0; i < lhs.length; ++i) temp += lhs[i] * rhs[i];
return temp / (getMod(lhs) * getMod(rhs));
}
export function euclideanDistance(lhs: number[], rhs: number[]) {
if (lhs.length !== rhs.length) throw new Error("embedding lengths do not match");
let sumDescriptor = 0;
for (let i = 0; i < lhs.length; i++) sumDescriptor += (lhs[i] - rhs[i]) ** 2;
return sumDescriptor ** 0.5;
}
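Despite its name, cosineDistance returns cosine similarity (1 for identical directions), which is why the test code below treats the maximum score as the best match. A short sketch:

const e1 = [0.1, 0.2, 0.3];
const e2 = [0.2, 0.4, 0.6]; // same direction, different magnitude
console.log(cosineDistance(e1, e2)); // 1
console.log(euclideanDistance(e1, e2)); // ~0.374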

@@ -0,0 +1,3 @@
export { cosineDistance, euclideanDistance } from "./common";
export { ArcFace, CosFace, PartialFC } from "./insightface";
export { AdaFace } from "./adaface";

@@ -0,0 +1,32 @@
import { Mat } from "../../cv/mat";
import { convertImage } from "../common/processors";
import { FaceRecognition, FaceRecognitionPredictOption } from "./common";
export class Insightface extends FaceRecognition {
public async doPredict(image: Mat, option?: FaceRecognitionPredictOption): Promise<number[]> {
const input = this.input;
const output = this.output;
if (option?.crop) image = image.crop(option.crop.sx, option.crop.sy, option.crop.sw, option.crop.sh);
image = image.resize(input.shape[3], input.shape[2]);
const nchwImageData = convertImage(image.data, { sourceImageFormat: "bgr", targetColorFormat: "bgr", targetShapeFormat: "nchw", targetNormalize: { mean: [127.5], std: [127.5] } });
const embedding = await this.session.run({
[input.name]: {
type: "float32",
data: nchwImageData,
shape: [1, 3, input.shape[2], input.shape[3]],
}
}).then(res => res[output.name]);
return Array.from(embedding);
}
}
export class ArcFace extends Insightface { }
export class CosFace extends Insightface { }
export class PartialFC extends Insightface { }

src/deploy/index.ts
@@ -0,0 +1 @@
export * as deploy from "./main";

src/deploy/main.ts
@@ -0,0 +1,4 @@
export * as facedet from "./facedet";
export * as faceid from "./faceid";
export * as faceattr from "./faceattr";
export * as facealign from "./facealign";

src/index.ts (new empty file)

src/main.ts (new empty file)

src/test.ts
@@ -0,0 +1,138 @@
import fs from "fs";
import { deploy } from "./deploy";
import { cv } from "./cv";
import { faceidTestData } from "./test_data/faceid";
import path from "path";
import crypto from "crypto";
async function cacheImage(group: string, url: string) {
const _url = new URL(url);
const cacheDir = path.join(__dirname, "../cache/images", group);
fs.mkdirSync(cacheDir, { recursive: true });
const cacheJsonFile = path.join(cacheDir, "config.json");
let jsonData: Record<string, string> = {};
if (fs.existsSync(cacheJsonFile)) {
jsonData = JSON.parse(fs.readFileSync(cacheJsonFile, "utf-8"));
const filename = jsonData[url];
if (filename && fs.existsSync(path.join(cacheDir, filename))) return path.join(cacheDir, filename);
}
const data = await fetch(_url).then(res => res.arrayBuffer()).then(buf => new Uint8Array(buf));
const allowedExtnames = [".jpg", ".jpeg", ".png", ".webp"];
let extname = path.extname(_url.pathname);
if (!allowedExtnames.includes(extname)) extname = ".jpeg";
const md5 = crypto.hash("md5", data, "hex");
const savename = md5 + extname;
jsonData[url] = savename;
fs.writeFileSync(cacheJsonFile, JSON.stringify(jsonData));
const savepath = path.join(cacheDir, savename);
fs.writeFileSync(savepath, data);
return savepath;
}
async function testGenderTest() {
const facedet = deploy.facedet.Yolov5Face.fromOnnx(fs.readFileSync("models/facedet/yolov5s.onnx"));
const detector = deploy.faceattr.GenderAgeDetector.fromOnnx(fs.readFileSync("models/faceattr/insight_gender_age.onnx"));
const image = await cv.Mat.load("https://b0.bdstatic.com/ugc/iHBWUj0XqytakT1ogBfBJwc7c305331d2cf904b9fb3d8dd3ed84f5.jpg");
const boxes = await facedet.predict(image);
if (!boxes.length) return console.error("No face detected");
for (const [idx, box] of boxes.entries()) {
const res = await detector.predict(image, { crop: { sx: box.left, sy: box.top, sw: box.width, sh: box.height } });
console.log(`[${idx + 1}]`, res);
}
}
async function testFaceID() {
const facedet = deploy.facedet.Yolov5Face.fromOnnx(fs.readFileSync("models/facedet/yolov5s.onnx"));
const faceid = deploy.faceid.CosFace.fromOnnx(fs.readFileSync("models/faceid/insightface/glint360k_cosface_r100.onnx"));
const { basic, tests } = faceidTestData.stars;
console.log("正在加载图片资源");
const basicImage = await cv.Mat.load(await cacheImage("faceid", basic.image));
const testsImages: Record<string, cv.Mat[]> = {};
for (const [name, imgs] of Object.entries(tests)) {
testsImages[name] = await Promise.all(imgs.map(img => cacheImage("faceid", img).then(img => cv.Mat.load(img))));
}
console.log("正在检测基本数据");
const basicDetectedFaces = await facedet.predict(basicImage);
const basicFaceIndex: Record<string, number> = {};
for (const [name, [x, y]] of Object.entries(basic.faces)) {
basicFaceIndex[name] = basicDetectedFaces.findIndex(box => box.x1 < x && box.x2 > x && box.y1 < y && box.y2 > y);
}
const basicEmbds: number[][] = [];
for (const box of basicDetectedFaces) {
const embd = await faceid.predict(basicImage, { crop: { sx: box.left, sy: box.top, sw: box.width, sh: box.height } });
basicEmbds.push(embd);
}
console.log("正在进行人脸对比");
for (const [name, image] of Object.entries(testsImages)) {
console.log(`[${name}] detecting`);
const index = basicFaceIndex[name];
if (index < 0) {
console.error(`[${name}] not found in the reference image`);
continue;
}
const basicEmbd = basicEmbds[index]
for (const [idx, img] of image.entries()) {
const box = await facedet.predict(img).then(boxes => boxes[0]);
if (!box) {
console.error(`[${idx + 1}] no face detected`);
continue;
}
const embd = await faceid.predict(img, { crop: { sx: box.left, sy: box.top, sw: box.width, sh: box.height } });
const compareEmbds = basicEmbds.map(e => deploy.faceid.cosineDistance(e, embd));
const max = Math.max(...compareEmbds);
const min = Math.min(...compareEmbds);
const distance = deploy.faceid.cosineDistance(basicEmbd, embd);
console.log(`[${idx + 1}] [${(distance.toFixed(4) == max.toFixed(4)) ? '\x1b[102mPASS' : '\x1b[101mFAIL'}\x1b[0m] similarity: ${distance.toFixed(4)}, max: ${max.toFixed(4)}, min: ${min.toFixed(4)}`);
}
}
}
async function testFaceAlign() {
const fd = deploy.facedet.Yolov5Face.fromOnnx(fs.readFileSync("models/facedet/yolov5s.onnx"));
// const fa = deploy.facealign.PFLD.fromOnnx(fs.readFileSync("models/facealign/pfld-106-lite.onnx"));
const fa = deploy.facealign.FaceLandmark1000.fromOnnx(fs.readFileSync("models/facealign/FaceLandmark1000.onnx"));
let image = await cv.Mat.load("https://bkimg.cdn.bcebos.com/pic/d52a2834349b033b5bb5f183119c21d3d539b6001712");
image = image.rotate(image.width / 2, image.height / 2, 0);
const face = await fd.predict(image).then(res => res[0].toSquare());
const points = await fa.predict(image, { crop: { sx: face.left, sy: face.top, sw: face.width, sh: face.height } });
points.points.forEach((point, idx) => {
image.circle(face.left + point.x, face.top + point.y, 2);
})
// const point = points.getPointsOf("rightEye")[1];
// image.circle(face.left + point.x, face.top + point.y, 2);
fs.writeFileSync("testdata/xx.jpg", image.encode(".jpg"));
let faceImage = image.rotate(face.centerX, face.centerY, -points.direction * 180 / Math.PI);
faceImage = faceImage.crop(face.left, face.top, face.width, face.height);
fs.writeFileSync("testdata/face.jpg", faceImage.encode(".jpg"));
console.log(points);
console.log(points.direction * 180 / Math.PI);
}
async function test() {
// testGenderTest();
// testFaceID();
testFaceAlign();
}
test().catch(err => {
console.error(err);
});

src/test_data/faceid.ts
@@ -0,0 +1,70 @@
interface StarData {
basic: { image: string, faces: Record<string, [x: number, y: number]> }
tests: Record<string, string[]>
}
const stars: StarData = {
basic: {
image: "https://i0.hdslb.com/bfs/archive/64e47ec9fdac9e24bc2b49b5aaad5560da1bfe3e.jpg",
faces: {
"huge": [758, 492],
"yangmi": [1901, 551],
"yangying": [2630, 521],
"liuyifei": [353, 671],
"dengjiajia": [1406, 597],
}
},
tests: {
"huge": [
"https://p4.itc.cn/images01/20231025/539a0095f34a47f0b6e7ebc8dca43967.png",
"https://p6.itc.cn/q_70/images03/20230517/bc9abf4b1d2f462390f9d5f4d799e102.jpeg",
"https://bj.bcebos.com/bjh-pixel/1703489647650979543_1_ainote_new.jpg",
"https://pic.rmb.bdstatic.com/bjh/beautify/e7eb49c5097c757f068b4dc4b4140a99.jpeg",
"https://q4.itc.cn/images01/20240922/0e27ce021504496fb33e428b5a6eb09d.jpeg",
"https://q6.itc.cn/images01/20241111/8d2eb1503c0f43129943d8a5f5b84291.jpeg",
"https://q0.itc.cn/images01/20250120/b0910e8c37a341e290ae205c6a930e11.jpeg",
"https://n.sinaimg.cn/sinacn20107/320/w2048h3072/20190107/4e5b-hrfcctn3800719.jpg"
],
"yangmi": [
"https://q1.itc.cn/images01/20240221/4044fff01df4480d841d8a3923869455.jpeg",
"https://b0.bdstatic.com/7f7d30e4ce392a11a3612e8c0c1970b0.jpg",
"https://b0.bdstatic.com/c157a78f9302d0538c3dd22fef2659ce.jpg",
"https://q5.itc.cn/images01/20240419/cb15f51e65e5440f92b0f36298f64643.jpeg",
"https://pic.rmb.bdstatic.com/bjh/240423/b5e5aa734b1b80e93b36b7b4250dae887703.jpeg",
"https://q7.itc.cn/images01/20240316/297474bdc779495a8f4c49825ff4af98.jpeg",
"https://p8.itc.cn/q_70/images03/20230426/dfdae05508aa4d6caa566e0a29c70501.jpeg",
"https://pic.rmb.bdstatic.com/bjh/8ca1d31655cc109d363b88dded23bfa03807.jpeg",
],
"yangying": [
"https://q9.itc.cn/images01/20240401/e59294e8d51140ef95a32ac15a18f1c5.jpeg",
"https://q2.itc.cn/images01/20240401/8c7266ed665140889054aa029b441948.jpeg",
"https://q7.itc.cn/images01/20240327/3b34d9fdcd5249489c91bff44e1b5f67.jpeg",
"https://p6.itc.cn/images01/20230111/766db970998e44baa0c52a4fe32c8d73.jpeg",
"https://bj.bcebos.com/bjh-pixel/1699070679633105560_0_ainote_new.jpg",
"https://p6.itc.cn/images01/20230217/556c66340432485ea9e1fe53109716ee.jpeg",
"https://img-nos.yiyouliao.com/e13ca727b210046d7dfe49943e167525.jpeg",
"https://p8.itc.cn/q_70/images03/20230614/d9c37a45350543db850e26b1712cb4b2.jpeg",
],
"liuyifei": [
"https://pic1.zhimg.com/v2-f8517e0d3d925640b6c8cc53068906f1_r.jpg",
"https://q8.itc.cn/q_70/images03/20240906/c296907327c44c3db0ea2232d98e5b41.png",
"https://q0.itc.cn/q_70/images03/20240706/dd0aded7edc94fbcad8175fcb7111d89.jpeg",
"https://q8.itc.cn/images01/20241002/561d2334b0e0451f97261292fcf66544.jpeg",
"https://q0.itc.cn/images01/20241109/8b02037be3c6403aa0dee761f7fc3841.jpeg",
"https://b0.bdstatic.com/ugc/M0gY3M_9OvzSG6xuTniCqQaa50a2e9a3f8d275158a90a8e448c237.jpg",
"https://q2.itc.cn/images01/20241002/cd77b7cb8f2044faaa46f75a1f392a50.jpeg",
"https://q0.itc.cn/images01/20241110/a22ba19b0a944eb28066b602378e2d45.jpeg",
],
"dengjiajia":[
"https://q4.itc.cn/q_70/images01/20240601/db61f410a20b4155b2e487b183372fc1.jpeg",
"https://b0.bdstatic.com/ugc/sR1WfaiiWi2KtStV_U3YGw49f741338ad3b10c10a1dec7aa5d8dd8.jpg",
"https://bkimg.cdn.bcebos.com/pic/b8389b504fc2d56285357c05334187ef76c6a6efc680",
"https://bkimg.cdn.bcebos.com/pic/b2de9c82d158ccbfc3fa73271ed8bc3eb135416d",
"https://bkimg.cdn.bcebos.com/pic/2cf5e0fe9925bc315c6099498a8f9ab1cb134854da9b",
"https://bkimg.cdn.bcebos.com/pic/738b4710b912c8fcc3ce2e773f578545d688d43f8b76"
]
}
}
export const faceidTestData = { stars };

src/utils/utils.ts
@@ -0,0 +1,33 @@
export namespace utils {
export function rgba2rgb<T extends Uint8Array | Float32Array>(data: T): T {
const pixelCount = data.length / 4;
const result = new (data.constructor as any)(pixelCount * 3) as T;
for (let i = 0; i < pixelCount; i++) {
result[i * 3 + 0] = data[i * 4 + 0];
result[i * 3 + 1] = data[i * 4 + 1];
result[i * 3 + 2] = data[i * 4 + 2];
}
return result;
}
export function rgb2bgr<T extends Uint8Array | Float32Array>(data: T): T {
const pixelCount = data.length / 3;
const result = new (data.constructor as any)(pixelCount * 3) as T;
for (let i = 0; i < pixelCount; i++) {
result[i * 3 + 0] = data[i * 3 + 2];
result[i * 3 + 1] = data[i * 3 + 1];
result[i * 3 + 2] = data[i * 3 + 0];
}
return result;
}
export function normalize(data: Uint8Array | Float32Array, mean: number[], std: number[]): Float32Array {
const result = new Float32Array(data.length);
for (let i = 0; i < data.length; i++) {
result[i] = (data[i] - mean[i % mean.length]) / std[i % std.length];
}
return result;
}
}
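A short sketch chaining the helpers: drop the alpha channel, swap to BGR, then scale to [-1, 1] (mean/std 127.5 chosen for illustration):

const rgba = new Uint8Array([255, 0, 0, 255]); // one red RGBA pixel
const bgr = utils.rgb2bgr(utils.rgba2rgb(rgba)); // Uint8Array [0, 0, 255]
const norm = utils.normalize(bgr, [127.5], [127.5]); // Float32Array [-1, -1, 1]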