feat: 新增人脸检测API和人脸检测测试脚本，并更新 API 文档。

2026-02-11 11:21:19 +08:00 · 2026-02-11 11:21:19 +08:00 · b5d0a66249
parent e0af18b363
commit b5d0a66249
8 changed files with 251 additions and 1 deletions
--- a/API_DOCUMENTATION.md
+++ b/API_DOCUMENTATION.md
@ -222,3 +222,39 @@
 *   **接口地址**: `/health`
 *   **请求方式**: `GET`
 *   **返回结果**: `{"status": "healthy", "service": "Face Feature Extractor"}`
 ### 2.3 人脸检测 (获取坐标)
 *   **接口地址**: `/api/detect_face`
 *   **请求方式**: `POST`
 *   **请求类型**: `multipart/form-data`
 *   **请求参数**:
    | 参数名 | 类型 | 必填 | 说明 |
    | :--- | :--- | :--- | :--- |
    | image | File | 是 | 图片文件 |
    | expand_scale | Float | 否 | 扩充比例，默认 0.0。例如 0.3 表示长宽各扩充 30% |
 *   **返回结果**:
    > **坐标说明**:
    > *   `x1`, `y1`: 人脸检测框 **左上角** 的像素坐标。
    > *   `x2`, `y2`: 人脸检测框 **右下角** 的像素坐标。
    > *   `score`: 检测置信度 (0-1之间)。
    > *   **注意**: 即使设置了 `expand_scale`，返回的坐标也会被限制在图片边界内 (Clip to bounds)。
    ```json
    {
        "success": true,
        "message": "Success",
        "faces": [
            {
                "x1": 100.0,
                "y1": 50.0,
                "x2": 200.0,
                "y2": 150.0,
                "score": 0.98
            }
        ],
        "processing_time": 0.02
    }
    ```
--- a/FaceFeatureExtractorAPI/feature_server.py
+++ b/FaceFeatureExtractorAPI/feature_server.py
@ -5,7 +5,7 @@
 """
 import uvicorn
-from fastapi import FastAPI, File, UploadFile, HTTPException
+from fastapi import FastAPI, File, UploadFile, HTTPException, Form
 from fastapi.middleware.cors import CORSMiddleware
 from pydantic import BaseModel
 from typing import List, Optional
@ -118,6 +118,94 @@ async def extract_feature(image: UploadFile = File(...)):
            message=f"Server error: {str(e)}"
        )
 # Response models for the face detection endpoint.
 class FaceRect(BaseModel):
    # One detected face box, in pixel coordinates of the uploaded image.
    x1: float  # x of the top-left corner
    y1: float  # y of the top-left corner
    x2: float  # x of the bottom-right corner
    y2: float  # y of the bottom-right corner
    score: float  # detection score reported by the detector for this box
 class DetectFaceResponse(BaseModel):
    # Response body of POST /api/detect_face.
    success: bool  # True only when at least one face was detected
    message: str  # "Success", "No face detected", or "Server error: ..."
    faces: List[FaceRect] = []  # detected boxes; left empty on failure
    processing_time: Optional[float] = None  # handler wall time in seconds
@app.post("/api/detect_face", response_model=DetectFaceResponse)
async def detect_face(image: UploadFile = File(...), expand_scale: float = Form(0.0)):
    """Detect faces in an uploaded image and return their bounding boxes.

    Args:
        image: Uploaded image file (multipart form field ``image``).
        expand_scale: Fraction by which each box's width and height are grown
            around the box centre (0.3 means 30% larger). Values <= 0 leave
            the detector's boxes unchanged.

    Returns:
        DetectFaceResponse with one FaceRect per detected face, clipped to the
        image bounds. ``success`` is False when no face is found or when an
        unexpected error occurs (the error text is placed in ``message``).

    Raises:
        HTTPException: 400 when the upload cannot be decoded as an image.
    """
    import time

    start_time = time.perf_counter()
    try:
        img = decode_image(image)
        if img is None:
            raise HTTPException(status_code=400, detail="Invalid image file")

        # Image size is needed to clip the (possibly expanded) boxes.
        h_img, w_img = img.shape[:2]

        # Call the detector directly, without rotation correction, so the
        # returned coordinates refer to the original image.
        boxes = get_extractor().detect_faces(img)

        face_rects = []
        if boxes:
            for box in boxes:
                x1, y1, x2, y2 = _expand_and_clip_box(
                    float(box.x1),
                    float(box.y1),
                    float(box.x2),
                    float(box.y2),
                    expand_scale,
                    float(w_img),
                    float(h_img),
                )
                face_rects.append(
                    FaceRect(x1=x1, y1=y1, x2=x2, y2=y2, score=float(box.score))
                )

        return DetectFaceResponse(
            success=bool(face_rects),
            message="Success" if face_rects else "No face detected",
            faces=face_rects,
            processing_time=time.perf_counter() - start_time,
        )
    except HTTPException:
        # HTTPException is an Exception subclass; without this clause the
        # generic handler below would turn the intended 400 into a 200 reply.
        raise
    except Exception as e:
        logger.exception("Detection failed: %s", e)
        return DetectFaceResponse(
            success=False,
            message=f"Server error: {str(e)}",
            processing_time=time.perf_counter() - start_time,
        )


def _expand_and_clip_box(x1, y1, x2, y2, expand_scale, img_w, img_h):
    """Grow a box around its centre by ``expand_scale`` and clip it to the image.

    Returns the resulting ``(x1, y1, x2, y2)`` tuple. The box is only grown
    when ``expand_scale`` is positive; clipping to ``[0, img_w]`` x
    ``[0, img_h]`` is always applied so no coordinate is negative or
    outside the image.
    """
    if expand_scale > 0:
        w = x2 - x1
        h = y2 - y1
        cx = x1 + w / 2
        cy = y1 + h / 2
        half_w = w * (1 + expand_scale) / 2
        half_h = h * (1 + expand_scale) / 2
        x1, x2 = cx - half_w, cx + half_w
        y1, y2 = cy - half_h, cy + half_h
    return (
        max(0.0, min(x1, img_w)),
        max(0.0, min(y1, img_h)),
        max(0.0, min(x2, img_w)),
        max(0.0, min(y2, img_h)),
    )
 if __name__ == "__main__":
    import argparse
    parser = argparse.ArgumentParser(description='Face Feature Extraction Microservice')
--- a/face_crop_1_scale_0.3.jpg
+++ b/face_crop_1_scale_0.3.jpg
--- a/face_crop_1_scale_0.6.jpg
+++ b/face_crop_1_scale_0.6.jpg
--- a/result_detected.jpg
+++ b/result_detected.jpg
--- a/result_detected_scale_0.3.jpg
+++ b/result_detected_scale_0.3.jpg
--- a/result_detected_scale_0.6.jpg
+++ b/result_detected_scale_0.6.jpg
--- a/test_detect_face.py
+++ b/test_detect_face.py
@ -0,0 +1,126 @@
 import requests
 import cv2
 import numpy as np
 import os
 import json
 import argparse
 import sys
 # Base URL of the face service that this test script calls.
 PYTHON_ALGO_URL = "http://192.168.0.37:18000"
 def get_default_image_path(candidates=None):
    """Return the first existing test image path, or None if none exists.

    Args:
        candidates: Optional iterable of paths to probe, in priority order.
            When omitted, the built-in list of developer-machine paths is
            used, which keeps the original no-argument behaviour.

    Returns:
        The first path for which ``os.path.exists`` is true, otherwise None.
    """
    if candidates is None:
        # Built-in fallback: a real image on the original author's machine.
        candidates = [
            r"C:\Users\24830\Desktop\人脸.jpg",
        ]
    for path in candidates:
        if os.path.exists(path):
            return path
    return None
 def detect_and_draw(image_path, expand_scale=0.0):
    """Call the face detection API for one image and save annotated results.

    Posts the image to ``/api/detect_face``, prints the JSON response, draws
    every returned box on a copy of the image, and writes these files into
    the current working directory:

    * ``face_crop_<n>_scale_<expand_scale>.jpg`` for each non-empty face crop
    * ``result_detected_scale_<expand_scale>.jpg`` with all boxes drawn

    Args:
        image_path: Path of the image file to send.
        expand_scale: Value sent as the ``expand_scale`` form field.

    Returns:
        None. All outcomes, including errors, are reported on stdout.
    """
    url = f"{PYTHON_ALGO_URL}/api/detect_face"
    print(f"\n[Processing] Image: {image_path}")
    print(f"[API URL] {url}")
    print(f"[Expand Scale] {expand_scale}")
    if not os.path.exists(image_path):
        print(f"❌ Error: Image file not found: {image_path}")
        return
    try:
        # 1. Load the image locally; it is used for drawing and cropping.
        # NOTE(review): np.fromfile + cv2.imdecode is presumably used instead
        # of cv2.imread so that non-ASCII paths work - confirm.
        img_array = np.fromfile(image_path, dtype=np.uint8)
        original_img = cv2.imdecode(img_array, cv2.IMREAD_COLOR)
        if original_img is None:
            print(f"❌ Error: Failed to read image using opencv: {image_path}")
            return
        # 2. Call the API. expand_scale is sent as form data (data=), not as
        # a query parameter (params=).
        data = {'expand_scale': expand_scale}
        with open(image_path, 'rb') as f:
            files = {'image': f}
            response = requests.post(url, files=files, data=data, timeout=10)
        if response.status_code != 200:
            print(f"❌ Failed: Status {response.status_code}, Response: {response.text}")
            return
        result = response.json()
        print("\n=== API Response ===")
        print(json.dumps(result, indent=2))
        # 3. Draw the boxes and save the crops.
        if result.get('success'):
            faces = result.get('faces', [])
            count = len(faces)
            print(f"\n✅ Success: Detected {count} faces.")
            # Draw on a copy so the crops are taken from the clean image.
            draw_img = original_img.copy()
            color = (0, 255, 0)  # green, in OpenCV's (B, G, R) order
            thickness = 2
            for i, face in enumerate(faces):
                x1 = int(face['x1'])
                y1 = int(face['y1'])
                x2 = int(face['x2'])
                y2 = int(face['y2'])
                score = face['score']
                cv2.rectangle(draw_img, (x1, y1), (x2, y2), color, thickness)
                label = f"Face {i+1}: {score:.2f}"
                # Keep the text baseline inside the image: boxes clipped to
                # the top edge have y1 near 0, and y1 - 10 would be off-image.
                label_y = max(y1 - 10, 15)
                cv2.putText(draw_img, label, (x1, label_y),
                            cv2.FONT_HERSHEY_SIMPLEX, 0.5, color, 2)
                print(f"  - Face {i+1}: Box({x1}, {y1}, {x2}, {y2}), Score: {score:.4f}")
                # Save the cropped face so the expansion can be inspected.
                face_crop = original_img[y1:y2, x1:x2]
                if face_crop.size > 0:
                    crop_filename = f"face_crop_{i+1}_scale_{expand_scale}.jpg"
                    cv2.imencode('.jpg', face_crop)[1].tofile(crop_filename)
                    print(f"    Saved crop: {crop_filename}")
            # 4. Save the annotated image.
            output_filename = f"result_detected_scale_{expand_scale}.jpg"
            cv2.imencode('.jpg', draw_img)[1].tofile(output_filename)
            print(f"\n✅ Result image saved to: {os.path.abspath(output_filename)}")
        else:
            print(f"⚠️ API logic returned failure: {result.get('message')}")
    except Exception as e:
        # Test script boundary: report the error with a traceback and return.
        print(f"❌ Error: {e}")
        import traceback
        traceback.print_exc()
 if __name__ == "__main__":
    # CLI: optional positional image path plus --scale for the expand ratio.
    parser = argparse.ArgumentParser(description='Face Detection API Test Script')
    parser.add_argument('image_path', nargs='?', help='Path to the image file')
    # %(default)s keeps the help text in sync with the real default; the
    # previous text claimed 0.0 while the default is 0.6.
    parser.add_argument('--scale', type=float, default=0.6,
                        help='Expand scale (default: %(default)s)')
    args = parser.parse_args()
    target_path = args.image_path
    if not target_path:
        # No path on the command line: fall back to a known local test image.
        default_path = get_default_image_path()
        if default_path:
            print(f"No image path provided, using default found: {default_path}")
            target_path = default_path
        else:
            print("Usage: python test_detect_face.py <path_to_image> [--scale 0.3]")
            print("Error: No image path provided and no default test image found.")
            sys.exit(1)
    detect_and_draw(target_path, args.scale)