From 9f87f90af95dc841865c340457773379d6e1e7d3 Mon Sep 17 00:00:00 2001
From: guanyuankai
Date: Fri, 31 Oct 2025 10:14:51 +0800
Subject: [PATCH] Complete the shared library (.so) code
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 .vscode/settings.json |  43 ++-
 CMakeLists.txt        |   3 -
 include/face_sdk.h    |  73 +++--
 src/face_pipeline.cpp | 666 ++++++++++++++++++++++++++++++++++++------
 src/face_pipeline.h   | 177 ++++++++---
 src/face_sdk_api.cpp  |  66 +++++
 src/face_sdk_jni.cpp  | 184 ++++++++++++
 7 files changed, 1055 insertions(+), 157 deletions(-)

diff --git a/.vscode/settings.json b/.vscode/settings.json
index 51b29f5..5ff2746 100644
--- a/.vscode/settings.json
+++ b/.vscode/settings.json
@@ -14,5 +14,46 @@
         "ANDROID_PLATFORM": "android-24"
     },
-    "cmake.buildDirectory": "${workspaceFolder}/out/build/android-arm64-v8a-Debug"
+    "cmake.buildDirectory": "${workspaceFolder}/out/build/android-arm64-v8a-Debug",
+    "files.associations": {
+        "algorithm": "cpp",
+        "cmath": "cpp",
+        "__bit_reference": "cpp",
+        "__hash_table": "cpp",
+        "__locale": "cpp",
+        "__node_handle": "cpp",
+        "__split_buffer": "cpp",
+        "__verbose_abort": "cpp",
+        "array": "cpp",
+        "cctype": "cpp",
+        "clocale": "cpp",
+        "cstdarg": "cpp",
+        "cstddef": "cpp",
+        "cstdint": "cpp",
+        "cstdio": "cpp",
+        "cstdlib": "cpp",
+        "cstring": "cpp",
+        "ctime": "cpp",
+        "cwchar": "cpp",
+        "execution": "cpp",
+        "memory": "cpp",
+        "initializer_list": "cpp",
+        "ios": "cpp",
+        "iosfwd": "cpp",
+        "iostream": "cpp",
+        "istream": "cpp",
+        "limits": "cpp",
+        "locale": "cpp",
+        "map": "cpp",
+        "mutex": "cpp",
+        "new": "cpp",
+        "stdexcept": "cpp",
+        "streambuf": "cpp",
+        "string": "cpp",
+        "string_view": "cpp",
+        "typeinfo": "cpp",
+        "unordered_map": "cpp",
+        "variant": "cpp",
+        "vector": "cpp"
+    }
 }
diff --git a/CMakeLists.txt b/CMakeLists.txt
index e7bcf12..fbc75f8 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -107,13 +107,10 @@ target_include_directories(face_sdk_jni PUBLIC
 # 7. Link libraries
 # -----------------------------------------------------------------
 target_link_libraries(face_sdk_jni
-    # OpenCV libraries
     ${OpenCV_LIBS}
-    # ONNX Runtime library
     onnxruntime
-    # Android NDK libraries
     log         # for __android_log_print
     android     # for AConfiguration, AAssetManager, etc.
     jnigraphics # for Android Bitmap access
diff --git a/include/face_sdk.h b/include/face_sdk.h
index a748da6..7464a2d 100644
--- a/include/face_sdk.h
+++ b/include/face_sdk.h
@@ -2,66 +2,65 @@
 #include <string>
 #include <vector>
+#include "opencv2/opencv.hpp" // the interface needs cv::Mat

-// Do not expose OpenCV headers here; forward-declare what we use
-namespace cv {
-    class Mat;
-}
-
-// SDK status codes
+// SDK status codes
 enum class SDKStatus {
     SUCCESS = 0,
-    MODEL_LOAD_ERROR = -1,
-    EXTRACTION_ERROR = -2,
-    NO_FACE_DETECTED = -3,
-    POOR_QUALITY = -4,
-    INVALID_INPUT = -5
+    MODEL_LOAD_ERROR = -1, // model loading failed
+    PIPELINE_ERROR = -2,   // pipeline (algorithm) execution failed
+    INVALID_INPUT = -3,    // invalid input (e.g. an empty image)
+    NOT_INITIALIZED = -4   // SDK not initialized
 };

-// Feature extraction result
-struct FeatureResult {
+// Result struct for feature extraction
+struct SDKExtractResult {
     SDKStatus status;
-    std::vector<float> feature; // 512-dimensional
-    std::string error_message;
+    std::vector<float> feature;
+    std::string message;
 };

-// FaceSDK: the public C++ interface class
+/**
+ * @class FaceSDK
+ * @brief Wraps FacePipeline as the C++ API (Pimpl idiom).
+ *        This is the interface the JNI layer calls.
+ */
 class FaceSDK {
 public:
     /**
-     * @brief Constructor: initializes the SDK and loads the models
-     * @param model_dir Directory containing the 7 .onnx model files
+     * @brief Constructor: loads the models
+     * @param model_dir Directory containing the .onnx files
      */
     FaceSDK(const std::string& model_dir);

     /**
-     * @brief Destructor: releases all resources
+     * @brief Destructor
      */
     ~FaceSDK();

     /**
-     * @brief API 1: extract the feature vector of a face image
-     * @param image Input image (OpenCV Mat, BGR format)
-     * @return FeatureResult struct with status and feature
+     * @brief Checks whether the SDK initialized successfully
      */
-    FeatureResult extractFeature(const cv::Mat& image);
+    bool IsInitialized() const;

     /**
-     * @brief API 2: compare two feature vectors (static)
-     * @param feature1 Feature 1
-     * @param feature2 Feature 2
-     * @return Similarity (0.0 ~ 1.0); larger means more similar
+     * @brief Extracts a face feature
+     * @param image cv::Mat image in BGR format
+     * @return SDKExtractResult with status and feature vector
      */
-    static float compareFeatures(const std::vector<float>& feature1,
-                                 const std::vector<float>& feature2);
+    SDKExtractResult ExtractFeature(const cv::Mat& image);
+
+    /**
+     * @brief Compares two feature vectors
+     * @param feat1 Feature 1
+     * @param feat2 Feature 2
+     * @return Cosine similarity
+     */
+    float Compare(const std::vector<float>& feat1, const std::vector<float>& feat2);

 private:
-    // PImpl pattern (Pointer to Implementation):
-    // hides the implementation details (FacePipeline, ONNX Runtime,
-    // OpenCV members) behind a single pointer, which keeps this
-    // header clean and compilation fast.
+    // Pimpl (Private Implementation)
+    // "Impl" is a forward-declared private class
     class Impl;
-    Impl* p_impl;
-};
-
+    std::unique_ptr<Impl> m_impl;
+};
\ No newline at end of file
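For orientation before the implementation diffs, this is how the reworked header is meant to be driven from C++. A minimal sketch: the model directory, image file names, and the 0.6 threshold are placeholders for illustration, not values taken from this patch:

    #include "face_sdk.h"

    int main() {
        FaceSDK sdk("/data/local/tmp/face_models"); // hypothetical model directory
        if (!sdk.IsInitialized()) return 1;

        // Hypothetical inputs; cv::imread yields BGR, which ExtractFeature expects.
        cv::Mat a = cv::imread("a.jpg");
        cv::Mat b = cv::imread("b.jpg");
        SDKExtractResult ra = sdk.ExtractFeature(a);
        SDKExtractResult rb = sdk.ExtractFeature(b);
        if (ra.status != SDKStatus::SUCCESS || rb.status != SDKStatus::SUCCESS) return 2;

        float sim = sdk.Compare(ra.feature, rb.feature); // cosine similarity
        return sim > 0.6f ? 0 : 3; // illustrative acceptance threshold
    }

Because the header only exposes SDKStatus, SDKExtractResult, and the Pimpl-backed FaceSDK class, callers never touch ONNX Runtime or the pipeline internals directly.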
diff --git a/src/face_pipeline.cpp b/src/face_pipeline.cpp
index 7ea7ec2..34b9995 100644
--- a/src/face_pipeline.cpp
+++ b/src/face_pipeline.cpp
@@ -1,88 +1,596 @@
 #include "face_pipeline.h"
-#include <iostream> // for logging
+#include <numeric>  // std::accumulate
+#include <cstring>  // strdup, memcpy

-// Constructor: sets up the ORT environment and session options, then loads the models
+// Constructor
 FacePipeline::FacePipeline(const std::string& model_dir)
-    : m_env(ORT_LOGGING_LEVEL_WARNING, "FaceSDK") // initialize the ORT environment
+    : m_env(ORT_LOGGING_LEVEL_WARNING, "FaceSDK"),
+      m_memory_info(Ort::MemoryInfo::CreateCpu(OrtArenaAllocator, OrtMemTypeDefault))
 {
-    // Configure session options
-    m_session_options.SetIntraOpNumThreads(1); // usually 1 on mobile
+    m_session_options.SetIntraOpNumThreads(4); // use 4 threads
     m_session_options.SetGraphOptimizationLevel(GraphOptimizationLevel::ORT_ENABLE_ALL);

-    // Load the models immediately
     m_initialized = LoadModels(model_dir);
     if (m_initialized) {
-        std::cout << "FacePipeline initialized successfully." << std::endl;
+        InitMemoryAllocators();
+        LOGI("FacePipeline initialized successfully.");
     } else {
-        std::cerr << "FacePipeline initialization failed."
<< std::endl; + LOGE("FacePipeline initialization failed."); } } -// 析构函数 (由于使用unique_ptr, 资源会自动释放) FacePipeline::~FacePipeline() {} - // (私有) 加载所有模型 bool FacePipeline::LoadModels(const std::string& model_dir) { - try { - // 【【修正点】】: - // 我们不再使用 to_wstring()。 - // 我们直接使用 .c_str(),因为Android API需要 const char* - - // 1. 人脸检测 - std::string detector_path = model_dir + "/faceboxesv2-640x640.onnx"; - m_session_detector = std::make_unique(m_env, detector_path.c_str(), m_session_options); - std::cout << "Loaded model: " << detector_path << std::endl; + auto load_session = [&](std::unique_ptr& session, const std::string& model_name) { + std::string model_path = model_dir + "/" + model_name; + try { + session = std::make_unique(m_env, model_path.c_str(), m_session_options); + LOGI("Loaded model: %s", model_path.c_str()); + } catch (const Ort::Exception& e) { + LOGE("Error loading model %s: %s", model_path.c_str(), e.what()); + return false; + } + return true; + }; - // 2. 关键点 (Net1) - std::string lm1_path = model_dir + "/face_landmarker_pts5_net1.onnx"; - m_session_landmarker1 = std::make_unique(m_env, lm1_path.c_str(), m_session_options); - std::cout << "Loaded model: " << lm1_path << std::endl; + if (!load_session(m_session_rotator, "model_gray_mobilenetv2_rotcls.onnx")) return false; + if (!load_session(m_session_detector, "faceboxesv2-640x640.onnx")) return false; + if (!load_session(m_session_pose_var, "fsanet-var.onnx")) return false; + if (!load_session(m_session_pose_conv, "fsanet-conv.onnx")) return false; + if (!load_session(m_session_landmarker1, "face_landmarker_pts5_net1.onnx")) return false; + if (!load_session(m_session_landmarker2, "face_landmarker_pts5_net2.onnx")) return false; + if (!load_session(m_session_recognizer, "face_recognizer.onnx")) return false; - // 3. 关键点 (Net2) - std::string lm2_path = model_dir + "/face_landmarker_pts5_net2.onnx"; - m_session_landmarker2 = std::make_unique(m_env, lm2_path.c_str(), m_session_options); - std::cout << "Loaded model: " << lm2_path << std::endl; - - // 4. 人脸识别 - std::string rec_path = model_dir + "/face_recognizer.onnx"; - m_session_recognizer = std::make_unique(m_env, rec_path.c_str(), m_session_options); - std::cout << "Loaded model: " << rec_path << std::endl; - - // 5. 旋转分类 - std::string rot_path = model_dir + "/model_gray_mobilenetv2_rotcls.onnx"; - m_session_rotator = std::make_unique(m_env, rot_path.c_str(), m_session_options); - std::cout << "Loaded model: " << rot_path << std::endl; - - // 6. 姿态估计 (VAR) - std::string pose_var_path = model_dir + "/fsanet-var.onnx"; - m_session_pose_var = std::make_unique(m_env, pose_var_path.c_str(), m_session_options); - std::cout << "Loaded model: " << pose_var_path << std::endl; - - // 7. 姿态估计 (CONV) - std::string pose_conv_path = model_dir + "/fsanet-conv.onnx"; - m_session_pose_conv = std::make_unique(m_env, pose_conv_path.c_str(), m_session_options); - std::cout << "Loaded model: " << pose_conv_path << std::endl; - - } catch (const Ort::Exception& e) { - // 如果任何模型加载失败,捕获异常 - std::cerr << "Error loading models: " << e.what() << std::endl; - return false; - } - - std::cout << "All 7 models loaded successfully." 
<< std::endl; + LOGI("All 7 models loaded successfully."); return true; } -// L2 归一化 (将在Extract中使用) -void FacePipeline::normalize_l2(std::vector& v) { +// (私有) 获取模型输入/输出信息 +void FacePipeline::InitMemoryAllocators() { + auto get_io_names = [&](Ort::Session* session, + std::vector& input_names, + std::vector& output_names, + std::vector& input_shape) + { + input_names.clear(); + output_names.clear(); + input_shape.clear(); + + for (size_t i = 0; i < session->GetInputCount(); ++i) { + auto input_name_ptr = session->GetInputNameAllocated(i, m_allocator); + input_names.push_back(strdup(input_name_ptr.get())); + } + + for (size_t i = 0; i < session->GetOutputCount(); ++i) { + auto output_name_ptr = session->GetOutputNameAllocated(i, m_allocator); + output_names.push_back(strdup(output_name_ptr.get())); + } + + auto input_type_info = session->GetInputTypeInfo(0); + auto tensor_info = input_type_info.GetTensorTypeAndShapeInfo(); + input_shape = tensor_info.GetShape(); + if (input_shape[0] < 1) input_shape[0] = 1; + }; + + get_io_names(m_session_rotator.get(), m_rot_input_names, m_rot_output_names, m_rot_input_shape); + get_io_names(m_session_detector.get(), m_det_input_names, m_det_output_names, m_det_input_shape); + get_io_names(m_session_pose_var.get(), m_pose_var_input_names, m_pose_var_output_names, m_pose_var_input_shape); + get_io_names(m_session_pose_conv.get(), m_pose_conv_input_names, m_pose_conv_output_names, m_pose_conv_input_shape); + get_io_names(m_session_landmarker1.get(), m_lm1_input_names, m_lm1_output_names, m_lm1_input_shape); + get_io_names(m_session_landmarker2.get(), m_lm2_input_names, m_lm2_output_names, m_lm2_input_shape); + get_io_names(m_session_recognizer.get(), m_rec_input_names, m_rec_output_names, m_rec_input_shape); + + // 生成 FaceBoxesV2 的锚点 + generate_anchors_faceboxes(m_det_input_shape[2], m_det_input_shape[3]); // H, W (640, 640) + + // 调整Blob缓冲区大小 (查找最大所需size) + size_t max_blob_size = 0; + auto update_max = [&](const std::vector& shape) { + size_t s = std::accumulate(shape.begin() + 1, shape.end(), 1, std::multiplies()); + if (s > max_blob_size) max_blob_size = s; + }; + update_max(m_rot_input_shape); + update_max(m_det_input_shape); + update_max(m_pose_var_input_shape); + update_max(m_lm1_input_shape); + update_max(m_rec_input_shape); + m_blob_buffer.resize(max_blob_size); +} + +// --- 图像预处理辅助函数 --- +void FacePipeline::image_to_blob(const cv::Mat& img, std::vector& blob, const float* mean, const float* std) { + int channels = img.channels(); + int height = img.rows; + int width = img.cols; + + for (int c = 0; c < channels; c++) { + for (int h = 0; h < height; h++) { + for (int w = 0; w < width; w++) { + float val; + if (channels == 3) { + val = static_cast(img.at(h, w)[c]); + } else { + val = static_cast(img.at(h, w)); + } + blob[c * width * height + h * width + w] = (val - mean[c]) * std[c]; + } + } + } +} + +Ort::Value FacePipeline::create_tensor(const std::vector& blob_data, const std::vector& input_shape) { + return Ort::Value::CreateTensor(m_memory_info, + const_cast(blob_data.data()), + blob_data.size(), + input_shape.data(), + input_shape.size()); +} + + +// --- 核心管线实现 --- + +bool FacePipeline::Extract(const cv::Mat& image, std::vector& feature) { + if (!m_initialized) { + LOGE("Extract failed: Pipeline is not initialized."); + return false; + } + if (image.empty()) { + LOGE("Extract failed: Input image is empty."); + return false; + } + + // --- 1. 
Rotation detection ---
    int rot_angle_code = RunRotation(image);
    cv::Mat upright_image;
    if (rot_angle_code >= 0) {
        cv::rotate(image, upright_image, rot_angle_code);
    } else {
        upright_image = image;
    }

    // --- 2. Face detection ---
    std::vector<FaceBox> boxes;
    if (!RunDetection(upright_image, boxes)) {
        LOGI("Extract failed: No face detected.");
        return false;
    }
    // (The Python reference uses topk=2; after NMS, boxes[0] is the best face.)
    FaceBox best_box = boxes[0];

    // Crop the face with padding, used for pose estimation.
    // Mirrors the Python crop_face, which pads out-of-image regions with black.
    cv::Rect face_rect_raw(best_box.x1, best_box.y1, best_box.x2 - best_box.x1, best_box.y2 - best_box.y1);
    int pad_top = std::max(0, -face_rect_raw.y);
    int pad_bottom = std::max(0, (face_rect_raw.y + face_rect_raw.height) - upright_image.rows);
    int pad_left = std::max(0, -face_rect_raw.x);
    int pad_right = std::max(0, (face_rect_raw.x + face_rect_raw.width) - upright_image.cols);

    cv::Mat face_crop_padded;
    cv::copyMakeBorder(upright_image, face_crop_padded, pad_top, pad_bottom, pad_left, pad_right, cv::BORDER_CONSTANT, cv::Scalar(0, 0, 0));
    cv::Rect face_rect_padded(face_rect_raw.x + pad_left, face_rect_raw.y + pad_top, face_rect_raw.width, face_rect_raw.height);
    cv::Mat face_crop = face_crop_padded(face_rect_padded);

    // Ordering note: in the Python reference (face_feature_extractor.py),
    // QualityOfPose.transform receives this *raw* padded face crop, not the
    // aligned face, so the pose quality filter runs before landmark
    // detection and alignment.

    // --- 3. Pose estimation (quality filter) ---
    FacePose pose;
    if (!RunPose(face_crop, pose)) {
        LOGI("Extract failed: Pose estimation failed.");
        return false;
    }

    if (std::abs(pose.yaw) > m_pose_threshold || std::abs(pose.pitch) > m_pose_threshold) {
        LOGI("Extract failed: Face pose (Y:%.1f, P:%.1f) exceeds threshold (%.1f)", pose.yaw, pose.pitch, m_pose_threshold);
        return false;
    }

    // --- 4. Landmark detection ---
    FaceLandmark landmark;
    if (!RunLandmark(upright_image, best_box, landmark)) {
        LOGI("Extract failed: Landmark detection failed.");
        return false;
    }

    // --- 5. Face alignment ---
    cv::Mat aligned_face = RunAlignment(upright_image, landmark);

    // --- 6. Feature extraction (L2 normalization happens inside RunRecognition) ---
    if (!RunRecognition(aligned_face, feature)) {
        LOGI("Extract failed: Feature recognition failed.");
        return false;
    }

    LOGI("Extract success.");
    return true;
}
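The padded-crop block in Extract above reappears verbatim inside RunLandmark below; a small shared helper would keep the two call sites in sync. A minimal sketch of such a helper, assuming the name CropFaceWithPadding, which is not part of this patch:

    // Hypothetical helper: crop `box` out of `image`, padding with black
    // wherever the box extends beyond the image borders.
    static cv::Mat CropFaceWithPadding(const cv::Mat& image, const FaceBox& box) {
        cv::Rect raw((int)box.x1, (int)box.y1,
                     (int)(box.x2 - box.x1), (int)(box.y2 - box.y1));
        int top    = std::max(0, -raw.y);
        int bottom = std::max(0, (raw.y + raw.height) - image.rows);
        int left   = std::max(0, -raw.x);
        int right  = std::max(0, (raw.x + raw.width) - image.cols);
        cv::Mat padded;
        cv::copyMakeBorder(image, padded, top, bottom, left, right,
                           cv::BORDER_CONSTANT, cv::Scalar(0, 0, 0));
        return padded(cv::Rect(raw.x + left, raw.y + top, raw.width, raw.height));
    }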
// --- Step 1: rotation detection (from face_feature_extractor.py) ---
void FacePipeline::preprocess_rotation(const cv::Mat& image, std::vector<float>& blob_data) {
    cv::Mat gray_img, resized, cropped, gray_3d;
    cv::cvtColor(image, gray_img, cv::COLOR_BGR2GRAY);
    cv::resize(gray_img, resized, cv::Size(256, 256), 0, 0, cv::INTER_LINEAR);
    int start = (256 - 224) / 2;
    cv::Rect crop_rect(start, start, 224, 224);
    cropped = resized(crop_rect);
    cv::cvtColor(cropped, gray_3d, cv::COLOR_GRAY2BGR);

    // Normalization: / 255.0 (mean = [0,0,0])
    const float mean[3] = {0.0f, 0.0f, 0.0f};
    const float std[3] = {1.0f / 255.0f, 1.0f / 255.0f, 1.0f / 255.0f}; // multiplying by 1/255 equals dividing by 255
    image_to_blob(gray_3d, blob_data, mean, std);
}

int FacePipeline::RunRotation(const cv::Mat& image) {
    preprocess_rotation(image, m_blob_buffer);
    auto input_tensor = create_tensor(m_blob_buffer, m_rot_input_shape);

    auto output_tensors = m_session_rotator->Run(Ort::RunOptions{nullptr},
                                                 m_rot_input_names.data(), &input_tensor, 1,
                                                 m_rot_output_names.data(), 1);

    float* output_data = output_tensors[0].GetTensorMutableData<float>();
    int max_index = std::distance(output_data, std::max_element(output_data, output_data + 4));

    // Map the 4-way classification to an OpenCV rotation code (correct_image_rotation)
    if (max_index == 1) return cv::ROTATE_90_CLOCKWISE;
    if (max_index == 2) return cv::ROTATE_180;
    if (max_index == 3) return cv::ROTATE_90_COUNTERCLOCKWISE;
    return -1; // already upright
}

// --- Step 2: face detection (from facedetector.py) ---
void FacePipeline::preprocess_detection(const cv::Mat& img, std::vector<float>& blob_data) {
    cv::Mat resized;
    cv::resize(img, resized, cv::Size(m_det_input_shape[3], m_det_input_shape[2])); // 640x640

    // Normalization: (img - [104, 117, 123]) * 1.0
    const float mean[3] = {104.0f, 117.0f, 123.0f}; // BGR
    const float std[3] = {1.0f, 1.0f, 1.0f};
    image_to_blob(resized, blob_data, mean, std);
}

bool FacePipeline::RunDetection(const cv::Mat& image, std::vector<FaceBox>& boxes) {
    float img_height = (float)image.rows;
    float img_width = (float)image.cols;

    preprocess_detection(image, m_blob_buffer);
    auto input_tensor = create_tensor(m_blob_buffer, m_det_input_shape);

    auto output_tensors = m_session_detector->Run(Ort::RunOptions{nullptr},
                                                  m_det_input_names.data(), &input_tensor, 1,
                                                  m_det_output_names.data(), 2); // this model has 2 outputs

    const float* bboxes_data = output_tensors[0].GetTensorData<float>(); // [1, N, 4]
    const float* probs_data = output_tensors[1].GetTensorData<float>();  // [1, N, 2]
    long num_anchors = output_tensors[0].GetTensorTypeAndShapeInfo().GetShape()[1];

    if (num_anchors != (long)m_anchors.size()) {
        LOGE("Anchor size mismatch! Expected %zu, Got %ld", m_anchors.size(), num_anchors);
        return false;
    }

    std::vector<FaceBox> bbox_collection;
    const float variance[2] = {0.1f, 0.2f}; // box-decode variances from the Python reference

    for (long i = 0; i < num_anchors; ++i) {
        float conf = probs_data[i * 2 + 1]; // probs[0, i, 1] = face score
        if (conf < m_det_threshold) continue;

        const Anchor& anchor = m_anchors[i];
        float dx = bboxes_data[i * 4 + 0];
        float dy = bboxes_data[i * 4 + 1];
        float dw = bboxes_data[i * 4 + 2];
        float dh = bboxes_data[i * 4 + 3];

        float cx = anchor.cx + dx * variance[0] * anchor.s_kx;
        float cy = anchor.cy + dy * variance[0] * anchor.s_ky;
        float w = anchor.s_kx * std::exp(dw * variance[1]);
        float h = anchor.s_ky * std::exp(dh * variance[1]);

        bbox_collection.push_back({
            (cx - w / 2.0f) * img_width,
            (cy - h / 2.0f) * img_height,
            (cx + w / 2.0f) * img_width,
            (cy + h / 2.0f) * img_height,
            conf
        });
    }

    boxes = hard_nms(bbox_collection, m_det_iou_threshold, m_det_topk); // hard NMS (nms_type=0)
    return !boxes.empty();
}
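To make the SSD-style decode above concrete, here is a tiny standalone check with illustrative numbers, not values from a real model run: an anchor at the image centre with normalized size 0.1 x 0.1, and one raw regression output.

    #include <cmath>
    #include <cstdio>

    int main() {
        const float variance[2] = {0.1f, 0.2f};
        float cx0 = 0.5f, cy0 = 0.5f, s_kx = 0.1f, s_ky = 0.1f; // anchor
        float dx = 0.4f, dy = -0.2f, dw = 0.7f, dh = 0.1f;      // model output

        float cx = cx0 + dx * variance[0] * s_kx;     // 0.5040
        float cy = cy0 + dy * variance[0] * s_ky;     // 0.4980
        float w  = s_kx * std::exp(dw * variance[1]); // ~0.1150
        float h  = s_ky * std::exp(dh * variance[1]); // ~0.1020

        // Corner coordinates in pixels for a 640x480 image:
        std::printf("x1=%.1f y1=%.1f x2=%.1f y2=%.1f\n",
                    (cx - w / 2) * 640.0f, (cy - h / 2) * 480.0f,
                    (cx + w / 2) * 640.0f, (cy + h / 2) * 480.0f);
        return 0;
    }

Center offsets are scaled by the anchor size and the variances before being applied, so small raw outputs move the box only slightly, and width and height are decoded through an exponential, which keeps them positive.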
void FacePipeline::generate_anchors_faceboxes(int target_height, int target_width) {
    // Port of the Python generate_anchors for FaceBoxesV2
    m_anchors.clear();
    std::vector<int> steps = {32, 64, 128};
    std::vector<std::vector<int>> min_sizes = {{32, 64, 128}, {256}, {512}};
    std::vector<std::vector<int>> feature_maps;
    for (int step : steps) {
        feature_maps.push_back({(int)std::ceil((float)target_height / step), (int)std::ceil((float)target_width / step)});
    }

    std::vector<float> offset_32 = {0.0f, 0.25f, 0.5f, 0.75f};
    std::vector<float> offset_64 = {0.0f, 0.5f};

    for (int k = 0; k < (int)feature_maps.size(); ++k) {
        auto f_map = feature_maps[k];
        auto tmp_min_sizes = min_sizes[k];
        int f_h = f_map[0];
        int f_w = f_map[1];
        for (int i = 0; i < f_h; ++i) {
            for (int j = 0; j < f_w; ++j) {
                for (int min_size : tmp_min_sizes) {
                    float s_kx = (float)min_size / target_width;
                    float s_ky = (float)min_size / target_height;

                    if (min_size == 32) {
                        // 4x4 densified anchors for the smallest scale
                        for (float offset_y : offset_32) for (float offset_x : offset_32)
                            m_anchors.push_back({(j + offset_x) * steps[k] / target_width, (i + offset_y) * steps[k] / target_height, s_kx, s_ky});
                    } else if (min_size == 64) {
                        // 2x2 densified anchors
                        for (float offset_y : offset_64) for (float offset_x : offset_64)
                            m_anchors.push_back({(j + offset_x) * steps[k] / target_width, (i + offset_y) * steps[k] / target_height, s_kx, s_ky});
                    } else {
                        m_anchors.push_back({(j + 0.5f) * steps[k] / target_width, (i + 0.5f) * steps[k] / target_height, s_kx, s_ky});
                    }
                }
            }
        }
    }
}


// --- Step 3: pose estimation (from imgchecker.py) ---
void FacePipeline::preprocess_pose(const cv::Mat& img, std::vector<float>& blob_data) {
    float pad = 0.3f; // padding ratio from the Python reference
    int h = img.rows;
    int w = img.cols;
    int nh = (int)(h + pad * h);
    int nw = (int)(w + pad * w);
    int nx1 = std::max(0, (nw - w) / 2);
    int ny1 = std::max(0, (nh - h) / 2);

    cv::Mat canvas = cv::Mat::zeros(nh, nw, CV_8UC3);
    img.copyTo(canvas(cv::Rect(nx1, ny1, w, h)));

    cv::Mat resized;
    cv::resize(canvas, resized, cv::Size(m_pose_var_input_shape[3], m_pose_var_input_shape[2])); // 64x64

    // Normalization: (img - 127.5) / 127.5
    const float mean[3] = {127.5f, 127.5f, 127.5f};
    const float std[3] = {1.0f / 127.5f, 1.0f / 127.5f, 1.0f / 127.5f};
    image_to_blob(resized, blob_data, mean, std);
}

bool FacePipeline::RunPose(const cv::Mat& face_crop, FacePose& pose) {
    preprocess_pose(face_crop, m_blob_buffer);

    // Run the VAR model
    auto input_tensor_var = create_tensor(m_blob_buffer, m_pose_var_input_shape);
    auto output_var = m_session_pose_var->Run(Ort::RunOptions{nullptr},
                                              m_pose_var_input_names.data(),
&input_tensor_var, 1, + m_pose_var_output_names.data(), 1); + + // 运行 CONV (使用相同的 blob) + auto input_tensor_conv = create_tensor(m_blob_buffer, m_pose_conv_input_shape); + auto output_conv = m_session_pose_conv->Run(Ort::RunOptions{nullptr}, + m_pose_conv_input_names.data(), &input_tensor_conv, 1, + m_pose_conv_output_names.data(), 1); + + const float* data_var = output_var[0].GetTensorData(); + const float* data_conv = output_conv[0].GetTensorData(); + + // 结合 (平均) + pose.yaw = (data_var[0] + data_conv[0]) / 2.0f; + pose.pitch = (data_var[1] + data_conv[1]) / 2.0f; + pose.roll = (data_var[2] + data_conv[2]) / 2.0f; + return true; +} + +// --- 步骤 4: 关键点检测 (来自 facelandmarks5er.py) --- +void FacePipeline::preprocess_landmark_net1(const cv::Mat& img, std::vector& blob_data) { + cv::Mat resized, gray_img; + cv::resize(img, resized, cv::Size(m_lm1_input_shape[3], m_lm1_input_shape[2])); // 112x112 + cv::cvtColor(resized, gray_img, cv::COLOR_BGR2GRAY); // + + // 归一化: 无 (0-255) + const float mean[1] = {0.0f}; + const float std[1] = {1.0f}; + image_to_blob(gray_img, blob_data, mean, std); +} + +// C++ 转译 facelandmarks5er.py::shape_index_process +std::vector FacePipeline::shape_index_process(const Ort::Value& feat_val, const Ort::Value& pos_val) { + auto feat_shape = feat_val.GetTensorTypeAndShapeInfo().GetShape(); + auto pos_shape = pos_val.GetTensorTypeAndShapeInfo().GetShape(); + const float* feat_data = feat_val.GetTensorData(); + const float* pos_data = pos_val.GetTensorData(); + + long feat_n = feat_shape[0]; // 1 + long feat_c = feat_shape[1]; + long feat_h = feat_shape[2]; + long feat_w = feat_shape[3]; + long pos_n = pos_shape[0]; // 1 + long landmark_x2 = pos_shape[1]; // 10 + int landmark_num = landmark_x2 / 2; // 5 + + float m_origin[] = {112.0f, 112.0f}; + float m_origin_patch[] = {15.0f, 15.0f}; + + int x_patch_h = (int)(m_origin_patch[0] * feat_h / m_origin[0] + 0.5f); + int x_patch_w = (int)(m_origin_patch[1] * feat_w / m_origin[1] + 0.5f); + int feat_patch_h = x_patch_h; + int feat_patch_w = x_patch_w; + + float r_h = (feat_patch_h - 1) / 2.0f; + float r_w = (feat_patch_w - 1) / 2.0f; + + std::vector out_shape = {feat_n, feat_c, x_patch_h, (long)landmark_num, x_patch_w}; + std::vector buff(feat_n * feat_c * x_patch_h * landmark_num * x_patch_w, 0.0f); + + for (int i = 0; i < landmark_num; ++i) { + for (int n = 0; n < feat_n; ++n) { + float y_pos = pos_data[n * landmark_x2 + 2 * i + 1]; + float x_pos = pos_data[n * landmark_x2 + 2 * i]; + + int y = (int)(y_pos * (feat_h - 1) - r_h + 0.5f); + int x = (int)(x_pos * (feat_w - 1) - r_w + 0.5f); + + for (int c = 0; c < feat_c; ++c) { + for (int ph = 0; ph < feat_patch_h; ++ph) { + for (int pw = 0; pw < feat_patch_w; ++pw) { + int y_p = y + ph; + int x_p = x + pw; + + long out_idx = n * (feat_c * x_patch_h * landmark_num * x_patch_w) + + c * (x_patch_h * landmark_num * x_patch_w) + + ph * (landmark_num * x_patch_w) + + i * (x_patch_w) + + pw; + + if (y_p < 0 || y_p >= feat_h || x_p < 0 || x_p >= feat_w) { + buff[out_idx] = 0.0f; + } else { + long feat_idx = n * (feat_c * feat_h * feat_w) + + c * (feat_h * feat_w) + + y_p * (feat_w) + + x_p; + buff[out_idx] = feat_data[feat_idx]; + } + } + } + } + } + } + return buff; +} + + +bool FacePipeline::RunLandmark(const cv::Mat& image, const FaceBox& box, FaceLandmark& landmark) { + // 1. 
裁剪人脸 + cv::Rect face_rect_raw(box.x1, box.y1, box.x2 - box.x1, box.y2 - box.y1); + int pad_top = std::max(0, -face_rect_raw.y); + int pad_bottom = std::max(0, (face_rect_raw.y + face_rect_raw.height) - image.rows); + int pad_left = std::max(0, -face_rect_raw.x); + int pad_right = std::max(0, (face_rect_raw.x + face_rect_raw.width) - image.cols); + cv::Mat face_crop_padded; + cv::copyMakeBorder(image, face_crop_padded, pad_top, pad_bottom, pad_left, pad_right, cv::BORDER_CONSTANT, cv::Scalar(0,0,0)); + cv::Rect face_rect_padded(face_rect_raw.x + pad_left, face_rect_raw.y + pad_top, face_rect_raw.width, face_rect_raw.height); + cv::Mat face_crop = face_crop_padded(face_rect_padded); + + // 2. 预处理 Net1 + preprocess_landmark_net1(face_crop, m_blob_buffer); + auto input_tensor_net1 = create_tensor(m_blob_buffer, m_lm1_input_shape); + + // 3. 运行 Net1 + auto output_net1 = m_session_landmarker1->Run(Ort::RunOptions{nullptr}, + m_lm1_input_names.data(), &input_tensor_net1, 1, + m_lm1_output_names.data(), 2); // 2 outputs + + // 4. Shape Index Process + std::vector shape_index_blob = shape_index_process(output_net1[0], output_net1[1]); + + // 5. 准备 Net2 输入 + auto input_tensor_net2 = Ort::Value::CreateTensor(m_memory_info, + shape_index_blob.data(), + shape_index_blob.size(), + m_lm2_input_shape.data(), + m_lm2_input_shape.size()); + + // 6. 运行 Net2 + auto output_net2 = m_session_landmarker2->Run(Ort::RunOptions{nullptr}, + m_lm2_input_names.data(), &input_tensor_net2, 1, + m_lm2_output_names.data(), 1); + + // 7. 后处理 + const float* data_net1_pos = output_net1[1].GetTensorData(); + const float* data_net2 = output_net2[0].GetTensorData(); + auto shape_net1_pos = output_net1[1].GetTensorTypeAndShapeInfo().GetShape(); // [1, 10] + int landmark_x2 = shape_net1_pos[1]; + + float scale_x = (box.x2 - box.x1) / 112.0f; + float scale_y = (box.y2 - box.y1) / 112.0f; + + for (int i = 0; i < 5; ++i) { + float x_norm = (data_net2[i * 2 + 0] + data_net1_pos[i * 2 + 0]) * 112.0f; + float y_norm = (data_net2[i * 2 + 1] + data_net1_pos[i * 2 + 1]) * 112.0f; + + float x = box.x1 + x_norm * scale_x; + float y = box.y1 + y_norm * scale_y; + + x = std::max(0.01f, std::min(x, (float)image.cols - 0.01f)); + y = std::max(0.01f, std::min(y, (float)image.rows - 0.01f)); + landmark.points[i] = cv::Point2f(x, y); + } + return true; +} + +// --- 步骤 5: 人脸对齐 (来自 facealign.py) --- +cv::Mat FacePipeline::RunAlignment(const cv::Mat& image, const FaceLandmark& landmark) { + // (align) + std::vector src_points; + std::vector dst_points; + + for (int i = 0; i < 5; ++i) { + src_points.push_back(landmark.points[i]); + dst_points.push_back(cv::Point2f(m_landmark_template.at(i, 0), + m_landmark_template.at(i, 1))); + } + + // (transformation_maker) -> estimateAffinePartial2D + cv::Mat transform_matrix = cv::estimateAffinePartial2D(src_points, dst_points); + + cv::Mat aligned_face; + // (spatial_transform) -> warpAffine + // (crop_width, crop_height = 256, 256) + cv::warpAffine(image, aligned_face, transform_matrix, m_align_output_size, cv::INTER_LINEAR); + + return aligned_face; +} + +// --- 步骤 6: 特征提取 (来自 facerecoger.py) --- +void FacePipeline::preprocess_recognition(const cv::Mat& img, std::vector& blob_data) { + cv::Mat resized, rgb_img; + // (resize to 248, 248) + cv::resize(img, resized, cv::Size(m_rec_input_shape[3], m_rec_input_shape[2])); + // (BGR -> RGB) + cv::cvtColor(resized, rgb_img, cv::COLOR_BGR2RGB); + + // 归一化: 无 (0-255) + const float mean[3] = {0.0f, 0.0f, 0.0f}; + const float std[3] = {1.0f, 1.0f, 1.0f}; + 
image_to_blob(rgb_img, blob_data, mean, std); +} + +void FacePipeline::normalize_sqrt_l2(std::vector& v) { + // (temp_result = np.sqrt(pred_result[0])) double norm = 0.0; - for (float val : v) { + for (float& val : v) { + val = std::sqrt(std::max(0.0f, val)); // 取 sqrt norm += val * val; } - if (norm > 1e-6) { // 避免除以零 + // (norm = temp_result / np.linalg.norm(...)) + if (norm > 1e-6) { norm = std::sqrt(norm); for (float& val : v) { val = static_cast(val / norm); @@ -90,28 +598,22 @@ void FacePipeline::normalize_l2(std::vector& v) { } } +bool FacePipeline::RunRecognition(const cv::Mat& aligned_face, std::vector& feature) { + preprocess_recognition(aligned_face, m_blob_buffer); + auto input_tensor = create_tensor(m_blob_buffer, m_rec_input_shape); + + auto output_tensors = m_session_recognizer->Run(Ort::RunOptions{nullptr}, + m_rec_input_names.data(), &input_tensor, 1, + m_rec_output_names.data(), 1); + + long feature_dim = output_tensors[0].GetTensorTypeAndShapeInfo().GetShape()[1]; + const float* output_data = output_tensors[0].GetTensorData(); + + feature.resize(feature_dim); + memcpy(feature.data(), output_data, feature_dim * sizeof(float)); + + // (后处理: SQRT-L2 Norm) + normalize_sqrt_l2(feature); -// Extract 方法的桩函数 (我们将在下一步实现) -bool FacePipeline::Extract(const cv::Mat& image, std::vector& feature) { - if (!m_initialized) { - std::cerr << "Pipeline is not initialized." << std::endl; - return false; - } - - if (image.empty()) { - std::cerr << "Input image is empty." << std::endl; - return false; - } - - // -------------------------------------------------- - // TODO: 在这里实现完整的 7 模型推理管线 - // -------------------------------------------------- - - // std::cout << "Extract method is not implemented yet." << std::endl; - - // 临时填充一个假的特征向量 - feature.assign(512, 0.5f); - normalize_l2(feature); - return true; } \ No newline at end of file diff --git a/src/face_pipeline.h b/src/face_pipeline.h index d41a8f5..8d413db 100644 --- a/src/face_pipeline.h +++ b/src/face_pipeline.h @@ -4,17 +4,21 @@ #include #include #include - -// ONNX Runtime C++ API -#include "onnxruntime_cxx_api.h" - -// OpenCV -#include "opencv2/opencv.hpp" - -// 为 compare_features 提供辅助函数 -#include +#include #include +#include #include +#include + +#include "onnxruntime_cxx_api.h" +#include "opencv2/opencv.hpp" +#include "opencv2/calib3d.hpp" // for estimateAffinePartial2D + +// --- 日志宏 --- +#define LOG_TAG "FacePipeline_CPP" +#define LOGI(...) __android_log_print(ANDROID_LOG_INFO, LOG_TAG, __VA_ARGS__) +#define LOGE(...) 
__android_log_print(ANDROID_LOG_ERROR, LOG_TAG, __VA_ARGS__) + /** * @brief 计算两个L2归一化的特征向量的余弦相似度 @@ -30,6 +34,62 @@ inline float compare_features(const std::vector& v1, const std::vector(dot_product))); } +// --- 辅助结构体 (与 facedetector.py::Box 对应) --- +struct FaceBox { + float x1, y1, x2, y2, score; +}; + +struct FaceLandmark { + std::array points; +}; + +struct FacePose { + float yaw, pitch, roll; +}; + +// --- NMS 辅助函数 (与 facedetector.py::hard_nms 对应) --- +inline float iou_of(const FaceBox& a, const FaceBox& b) { + float inter_x1 = std::max(a.x1, b.x1); + float inter_y1 = std::max(a.y1, b.y1); + float inter_x2 = std::min(a.x2, b.x2); + float inter_y2 = std::min(a.y2, b.y2); + + if (inter_x1 < inter_x2 && inter_y1 < inter_y2) { + float inter_area = (inter_x2 - inter_x1 + 1.0f) * (inter_y2 - inter_y1 + 1.0f); + float a_area = (a.x2 - a.x1 + 1.0f) * (a.y2 - a.y1 + 1.0f); + float b_area = (b.x2 - b.x1 + 1.0f) * (b.y2 - b.y1 + 1.0f); + float union_area = a_area + b_area - inter_area; + return inter_area / union_area; + } + return 0.0f; +} + +inline std::vector hard_nms(std::vector& boxes, float iou_threshold, int topk) { + if (boxes.empty()) return {}; + std::sort(boxes.begin(), boxes.end(), [](const FaceBox& a, const FaceBox& b) { + return a.score > b.score; + }); + + std::vector merged(boxes.size(), 0); + std::vector output; + + for (int i = 0; i < boxes.size(); ++i) { + if (merged[i]) continue; + + output.push_back(boxes[i]); + merged[i] = 1; + + for (int j = i + 1; j < boxes.size(); ++j) { + if (merged[j]) continue; + if (iou_of(boxes[i], boxes[j]) > iou_threshold) { + merged[j] = 1; + } + } + if (output.size() >= topk) break; + } + return output; +} + /** * @class FacePipeline @@ -37,43 +97,53 @@ inline float compare_features(const std::vector& v1, const std::vector& feature); private: - /** - * @brief (内部) 由构造函数调用,加载所有7个模型 - */ + // --- 模型加载与初始化 --- bool LoadModels(const std::string& model_dir); + void InitMemoryAllocators(); - /** - * @brief (内部) L2归一化向量 - */ - void normalize_l2(std::vector& v); + // --- 核心管线步骤 --- + void preprocess_rotation(const cv::Mat &image, std::vector &blob_data); + int RunRotation(const cv::Mat& image); // [模型5] + bool RunDetection(const cv::Mat& image, std::vector& boxes); // [模型1] + bool RunPose(const cv::Mat& face_crop, FacePose& pose); // [模型6, 7] + bool RunLandmark(const cv::Mat& image, const FaceBox& box, FaceLandmark& landmark); // [模型2, 3] + cv::Mat RunAlignment(const cv::Mat& image, const FaceLandmark& landmark); // + bool RunRecognition(const cv::Mat& aligned_face, std::vector& feature); // [模型4] + + // --- 预处理/后处理 辅助函数 --- + + // [模型1] FaceBoxesV2 + struct Anchor { float cx, cy, s_kx, s_ky; }; + std::vector m_anchors; + void generate_anchors_faceboxes(int target_height, int target_width); + void preprocess_detection(const cv::Mat& img, std::vector& blob_data); + + // [模型6, 7] FSANet + void preprocess_pose(const cv::Mat& img, std::vector& blob_data); + + // [模型2, 3] Landmark5er + void preprocess_landmark_net1(const cv::Mat& img, std::vector& blob_data); + std::vector shape_index_process(const Ort::Value& feat_data, const Ort::Value& pos_data); + + // [模型4] FaceRecognizer + void preprocess_recognition(const cv::Mat& img, std::vector& blob_data); + void normalize_sqrt_l2(std::vector& v); // + + // 通用 + void image_to_blob(const cv::Mat& img, std::vector& blob, const float* mean, const float* std); + Ort::Value create_tensor(const std::vector& blob_data, const std::vector& input_shape); // --- ONNX Runtime 核心组件 --- Ort::Env m_env; Ort::SessionOptions 
m_session_options; + Ort::AllocatorWithDefaultOptions m_allocator; + Ort::MemoryInfo m_memory_info; bool m_initialized = false; // --- 7个模型的会话 (Session) --- @@ -84,4 +154,43 @@ private: std::unique_ptr m_session_rotator; std::unique_ptr m_session_pose_var; std::unique_ptr m_session_pose_conv; + + // --- ONNX模型输入/输出名称 (C-style strings) --- + // 我们在加载模型时获取这些 + std::vector m_rot_input_names, m_rot_output_names; + std::vector m_rot_input_shape; + + std::vector m_det_input_names, m_det_output_names; + std::vector m_det_input_shape; + + std::vector m_pose_var_input_names, m_pose_var_output_names; + std::vector m_pose_var_input_shape; + + std::vector m_pose_conv_input_names, m_pose_conv_output_names; + std::vector m_pose_conv_input_shape; + + std::vector m_lm1_input_names, m_lm1_output_names; + std::vector m_lm1_input_shape; + + std::vector m_lm2_input_names, m_lm2_output_names; + std::vector m_lm2_input_shape; + + std::vector m_rec_input_names, m_rec_output_names; + std::vector m_rec_input_shape; + + // --- 临时缓冲区 --- + std::vector m_blob_buffer; + + // --- 常量 (来自 Python) --- + const float m_det_threshold = 0.35f; + const float m_det_iou_threshold = 0.45f; + const int m_det_topk = 300; + const float m_pose_threshold = 30.0f; // (来自 face_feature_extractor.py) + const cv::Mat m_landmark_template = (cv::Mat_(5, 2) << + 89.3095f, 72.9025f, // (来自 facealign.py) + 169.3095f, 72.9025f, // + 127.8949f, 127.0441f, // + 96.8796f, 184.8907f, // + 159.1065f, 184.7601f); // + const cv::Size m_align_output_size = cv::Size(256, 256); // }; \ No newline at end of file diff --git a/src/face_sdk_api.cpp b/src/face_sdk_api.cpp index e69de29..991699b 100644 --- a/src/face_sdk_api.cpp +++ b/src/face_sdk_api.cpp @@ -0,0 +1,66 @@ +#include "face_sdk.h" +#include "face_pipeline.h" // 在 .cpp 中包含实现 +#include + +// --- Pimpl 实现 --- +// 我们在 .cpp 文件中定义私有实现类 +class FaceSDK::Impl { +public: + // Impl 的构造函数真正创建了 FacePipeline + Impl(const std::string& model_dir) + : pipeline(std::make_unique(model_dir)) + { + // 构造函数体 + } + + // 检查内部管线是否OK + bool IsInitialized() const { + return pipeline && pipeline->IsInitialized(); + } + + // 持有核心管线的智能指针 + std::unique_ptr pipeline; +}; + +// --- FaceSDK 公共方法的实现 --- + +// 构造函数:创建 Impl 实例 +FaceSDK::FaceSDK(const std::string& model_dir) + : m_impl(std::make_unique(model_dir)) +{ + // 构造函数体 +} + +// 析构函数:必须在 .cpp 中定义,因为 Impl 是不完整类型 +FaceSDK::~FaceSDK() = default; + +// IsInitialized 的实现 +bool FaceSDK::IsInitialized() const { + if (!m_impl) return false; + return m_impl->IsInitialized(); +} + +// Compare 的实现 (这是一个简单的辅助函数) +float FaceSDK::Compare(const std::vector& feat1, const std::vector& feat2) { + // 调用我们在 face_pipeline.h 中定义的全局辅助函数 + return compare_features(feat1, feat2); +} + +// ExtractFeature 的实现 +SDKExtractResult FaceSDK::ExtractFeature(const cv::Mat& image) { + if (!IsInitialized()) { + return { SDKStatus::NOT_INITIALIZED, {}, "SDK 未初始化" }; + } + if (image.empty()) { + return { SDKStatus::INVALID_INPUT, {}, "输入图像为空" }; + } + + std::vector feature; + bool success = m_impl->pipeline->Extract(image, feature); + + if (success) { + return { SDKStatus::SUCCESS, feature, "提取成功" }; + } else { + return { SDKStatus::PIPELINE_ERROR, {}, "未检测到合格人脸或算法出错" }; + } +} \ No newline at end of file diff --git a/src/face_sdk_jni.cpp b/src/face_sdk_jni.cpp index e69de29..dc7ff56 100644 --- a/src/face_sdk_jni.cpp +++ b/src/face_sdk_jni.cpp @@ -0,0 +1,184 @@ +#include +#include +#include +#include +#include // 用于 Bitmap -> cv::Mat + +#include "face_sdk.h" // 我们的 C++ API +#include "opencv2/opencv.hpp" + +// --- 
日志宏 --- +#define LOG_TAG "FaceSDK_JNI" +#define LOGI(...) __android_log_print(ANDROID_LOG_INFO, LOG_TAG, __VA_ARGS__) +#define LOGE(...) __android_log_print(ANDROID_LOG_ERROR, LOG_TAG, __VA_ARGS__) + +// --- 全局 SDK 实例 --- +// 我们将 C++ SDK 实例保存在一个全局智能指针中 +// 指针 (long) 将被返回给 Java 层持有 +std::unique_ptr g_sdk_instance; + +// --- 辅助函数:Bitmap 转 cv::Mat --- +bool ConvertBitmapToMat(JNIEnv* env, jobject j_bitmap, cv::Mat& out_mat) { + AndroidBitmapInfo bmp_info; + if (AndroidBitmap_getInfo(env, j_bitmap, &bmp_info) < 0) { + LOGE("AndroidBitmap_getInfo() failed"); + return false; + } + + // 只支持 RGBA_8888 + if (bmp_info.format != ANDROID_BITMAP_FORMAT_RGBA_8888) { + LOGE("Unsupported bitmap format. Only RGBA_8888 is supported."); + return false; + } + + void* bmp_pixels; + if (AndroidBitmap_lockPixels(env, j_bitmap, &bmp_pixels) < 0) { + LOGE("AndroidBitmap_lockPixels() failed"); + return false; + } + + // 创建一个 cv::Mat 来包装 Bitmap 像素 + // 注意:这是 RGBA 格式 + cv::Mat tmp_mat(bmp_info.height, bmp_info.width, CV_8UC4, bmp_pixels); + + // 我们的人脸管线需要 BGR 格式 + // TODO: 确认 python 管线是否需要 RGB。cv::cvtColor更安全。 + cv::cvtColor(tmp_mat, out_mat, cv::COLOR_RGBA2BGR); + + AndroidBitmap_unlockPixels(env, j_bitmap); + return true; +} + + +// --- JNI 接口实现 --- + +#ifdef __cplusplus +extern "C" { +#endif + +// JNI 函数命名规则: Java_包名_类名_方法名 +// 【【【请将 "com_facesdk_wrapper_FaceSDKWrapper" 替换为您自己的包名和类名】】】 + +/** + * @brief 初始化 SDK + * @param env JNIEnv + * @param thiz Java 层的 'this' + * @param j_model_dir (String) 包含 .onnx 文件的路径 + * @return (long) 指向 C++ FaceSDK 实例的指针。如果为 0,则初始化失败。 + */ +JNIEXPORT jlong JNICALL +Java_com_facesdk_wrapper_FaceSDKWrapper_nativeInit(JNIEnv *env, jobject thiz, jstring j_model_dir) { + const char *model_dir_cstr = env->GetStringUTFChars(j_model_dir, nullptr); + if (model_dir_cstr == nullptr) { + LOGE("Failed to get model dir string"); + return 0; // 返回 0 (null) + } + + std::string model_dir(model_dir_cstr); + env->ReleaseStringUTFChars(j_model_dir, model_dir_cstr); + + LOGI("Initializing FaceSDK with model path: %s", model_dir.c_str()); + + try { + g_sdk_instance = std::make_unique(model_dir); + + if (g_sdk_instance && g_sdk_instance->IsInitialized()) { + LOGI("SDK Initialized successfully."); + // 返回实例的指针地址 (转为 long) + return (jlong)g_sdk_instance.get(); + } else { + LOGE("SDK g_sdk_instance->IsInitialized() failed."); + g_sdk_instance.reset(); // 释放内存 + return 0; + } + } catch (const std::exception& e) { + LOGE("SDK Initialization failed with exception: %s", e.what()); + g_sdk_instance.reset(); + return 0; + } +} + +/** + * @brief 释放 SDK + */ +JNIEXPORT void JNICALL +Java_com_facesdk_wrapper_FaceSDKWrapper_nativeRelease(JNIEnv *env, jobject thiz) { + LOGI("Releasing SDK instance."); + g_sdk_instance.reset(); // 释放智能指针管理的内存 +} + +/** + * @brief 提取特征 + * @param env JNIEnv + * @param thiz Java 层的 'this' + * @param j_bitmap (Bitmap) 待处理的图像 + * @return (float[]) 512维特征向量,如果失败则返回 null + */ +JNIEXPORT jfloatArray JNICALL +Java_com_facesdk_wrapper_FaceSDKWrapper_nativeExtractFeature(JNIEnv *env, jobject thiz, jobject j_bitmap) { + if (!g_sdk_instance) { + LOGE("SDK not initialized. Call init() first."); + return nullptr; + } + + // 1. Bitmap -> cv::Mat + cv::Mat image_bgr; + if (!ConvertBitmapToMat(env, j_bitmap, image_bgr)) { + LOGE("Failed to convert Bitmap to cv::Mat"); + return nullptr; + } + + // 2. 
调用 C++ API + SDKExtractResult result = g_sdk_instance->ExtractFeature(image_bgr); + + if (result.status != SDKStatus::SUCCESS) { + LOGE("Feature extraction failed: %s", result.message.c_str()); + return nullptr; + } + + // 3. std::vector -> jfloatArray + jfloatArray j_feature = env->NewFloatArray(result.feature.size()); + if (j_feature == nullptr) { + LOGE("Failed to create new jfloatArray"); + return nullptr; + } + env->SetFloatArrayRegion(j_feature, 0, result.feature.size(), result.feature.data()); + + return j_feature; +} + +/** + * @brief 比较特征 + * @param env JNIEnv + * @param thiz Java 层的 'this' + * @param j_feat1 (float[]) 特征1 + * @param j_feat2 (float[]) 特征2 + * @return (float) 余弦相似度 + */ +JNIEXPORT jfloat JNICALL +Java_com_facesdk_wrapper_FaceSDKWrapper_nativeCompare(JNIEnv *env, jobject thiz, jfloatArray j_feat1, jfloatArray j_feat2) { + if (!g_sdk_instance) { + LOGE("SDK not initialized."); + return -2.0f; // 返回无效值 + } + + // 1. jfloatArray -> std::vector + jsize len1 = env->GetArrayLength(j_feat1); + jfloat* body1 = env->GetFloatArrayElements(j_feat1, nullptr); + std::vector feat1(body1, body1 + len1); + env->ReleaseFloatArrayElements(j_feat1, body1, 0); + + // 2. jfloatArray -> std::vector + jsize len2 = env->GetArrayLength(j_feat2); + jfloat* body2 = env->GetFloatArrayElements(j_feat2, nullptr); + std::vector feat2(body2, body2 + len2); + env->ReleaseFloatArrayElements(j_feat2, body2, 0); + + // 3. 调用 C++ API + return g_sdk_instance->Compare(feat1, feat2); +} + + +#ifdef __cplusplus +} +#endif \ No newline at end of file
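A design note on the JNI layer above: nativeInit returns the instance pointer as a jlong, but every entry point actually routes through the single global g_sdk_instance, so the returned handle is informational and only one SDK instance can exist per process. If multiple instances were ever needed, the handle itself could carry ownership instead. A hypothetical sketch, not part of this patch; the Java side would then pass the handle back on every call:

    // Hypothetical handle-based variant of init/release.
    JNIEXPORT jlong JNICALL
    Java_com_facesdk_wrapper_FaceSDKWrapper_nativeInit(JNIEnv* env, jobject, jstring j_dir) {
        const char* dir = env->GetStringUTFChars(j_dir, nullptr);
        if (dir == nullptr) return 0;
        auto* sdk = new FaceSDK(dir); // ownership is handed to the Java side
        env->ReleaseStringUTFChars(j_dir, dir);
        if (!sdk->IsInitialized()) { delete sdk; return 0; }
        return reinterpret_cast<jlong>(sdk);
    }

    JNIEXPORT void JNICALL
    Java_com_facesdk_wrapper_FaceSDKWrapper_nativeRelease(JNIEnv*, jobject, jlong handle) {
        delete reinterpret_cast<FaceSDK*>(handle); // deleting a 0 handle is a no-op
    }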