// This file is part of OpenCV project.
// It is subject to the license terms in the LICENSE file found in the top-level directory
// of this distribution and at http://opencv.org/license.html.

#include "test_precomp.hpp"

namespace opencv_test { namespace {

// label format:
//   image_name
//   num_face
//   face_1
//   face_..
//   face_num
std::map<std::string, Mat> blobFromTXT(const std::string& path, int numCoords)
{
    std::ifstream ifs(path.c_str());
    CV_Assert(ifs.is_open());

    std::map<std::string, Mat> gt;

    Mat faces;
    int faceNum = -1;
    int faceCount = 0;
    for (std::string line, key; getline(ifs, line); )
    {
        std::istringstream iss(line);
        if (line.find(".png") != std::string::npos)
        {
            // Get filename
            iss >> key;
        }
        else if (line.find(" ") == std::string::npos)
        {
            // Get the number of faces
            iss >> faceNum;
        }
        else
        {
            // Get faces
            Mat face(1, numCoords, CV_32FC1);
            for (int j = 0; j < numCoords; j++)
            {
                iss >> face.at<float>(0, j);
            }
            faces.push_back(face);
            faceCount++;
        }

        if (faceCount == faceNum)
        {
            // Store faces
            gt[key] = faces;

            faces.release();
            faceNum = -1;
            faceCount = 0;
        }
    }

    return gt;
}

TEST(Objdetect_face_detection, regression)
{
    // Pre-set params
    float scoreThreshold = 0.7f;
    float matchThreshold = 0.7f;
    float l2disThreshold = 15.0f;
    int numLM = 5;
    int numCoords = 4 + 2 * numLM;

    // Load ground truth labels
    std::map<std::string, Mat> gt = blobFromTXT(findDataFile("dnn_face/detection/cascades_labels.txt"), numCoords);

    // Initialize detector
    std::string model = findDataFile("dnn/onnx/models/yunet-202303.onnx", false);
    Ptr<FaceDetectorYN> faceDetector = FaceDetectorYN::create(model, "", Size(300, 300));
    faceDetector->setScoreThreshold(0.7f);

    // Detect and match
    for (auto item: gt)
    {
        std::string imagePath = findDataFile("cascadeandhog/images/" + item.first);
        Mat image = imread(imagePath);

        // Set input size
        faceDetector->setInputSize(image.size());

        // Run detection
        Mat faces;
        faceDetector->detect(image, faces);
        // std::cout << item.first << " " << item.second.rows << " " << faces.rows << std::endl;

        // Match bboxes and landmarks.
        // Each detection row stores the bbox (x, y, w, h), numLM landmark points (x, y each),
        // and the confidence score at index numCoords.
        std::vector<bool> matchedItem(item.second.rows, false);
        for (int i = 0; i < faces.rows; i++)
        {
            if (faces.at<float>(i, numCoords) < scoreThreshold)
                continue;

            bool boxMatched = false;
            std::vector<bool> lmMatched(numLM, false);
            cv::Rect2f resBox(faces.at<float>(i, 0), faces.at<float>(i, 1), faces.at<float>(i, 2), faces.at<float>(i, 3));
            for (int j = 0; j < item.second.rows && !boxMatched; j++)
            {
                if (matchedItem[j])
                    continue;

                // Retrieve bbox and compare IoU
                cv::Rect2f gtBox(item.second.at<float>(j, 0), item.second.at<float>(j, 1), item.second.at<float>(j, 2), item.second.at<float>(j, 3));
                double interArea = (resBox & gtBox).area();
                double iou = interArea / (resBox.area() + gtBox.area() - interArea);
                if (iou >= matchThreshold)
                {
                    boxMatched = true;
                    matchedItem[j] = true;
                }

                // Match landmarks only if the bbox is matched
                if (!boxMatched)
                    continue;
                for (int lmIdx = 0; lmIdx < numLM; lmIdx++)
                {
                    float gtX = item.second.at<float>(j, 4 + 2 * lmIdx);
                    float gtY = item.second.at<float>(j, 4 + 2 * lmIdx + 1);
                    float resX = faces.at<float>(i, 4 + 2 * lmIdx);
                    float resY = faces.at<float>(i, 4 + 2 * lmIdx + 1);
                    float l2dis = std::sqrt((gtX - resX) * (gtX - resX) + (gtY - resY) * (gtY - resY));

                    if (l2dis <= l2disThreshold)
                    {
                        lmMatched[lmIdx] = true;
                    }
                }
                break;
            }
            EXPECT_TRUE(boxMatched) << "In image " << item.first << ", cannot match resBox " << resBox << " with any ground truth.";
            if (boxMatched)
            {
                EXPECT_TRUE(std::all_of(lmMatched.begin(), lmMatched.end(), [](bool v) { return v; }))
                    << "In image " << item.first << ", resBox " << resBox << " matched but its landmarks failed to match.";
            }
        }
    }
}
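// Illustrative addition (not part of the original regression suite): a minimal
// sanity check of the IoU formula used above, inter / (areaA + areaB - inter),
// on hand-computed rectangles. The test name below is an assumption chosen for
// this sketch.
TEST(Objdetect_face_detection, iou_formula_example)
{
    cv::Rect2f a(0.f, 0.f, 10.f, 10.f);
    cv::Rect2f b(5.f, 5.f, 10.f, 10.f);

    double interArea = (a & b).area();                            // overlap is 5 x 5 = 25
    double iou = interArea / (a.area() + b.area() - interArea);   // 25 / (100 + 100 - 25)
    EXPECT_NEAR(iou, 25.0 / 175.0, 1e-6);
}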
TEST(Objdetect_face_recognition, regression)
{
    // Pre-set params
    float score_thresh = 0.9f;
    float nms_thresh = 0.3f;
    double cosine_similar_thresh = 0.363;
    double l2norm_similar_thresh = 1.128;

    // Load ground truth labels
    std::ifstream ifs(findDataFile("dnn_face/recognition/cascades_label.txt").c_str());
    CV_Assert(ifs.is_open());

    std::set<std::string> fSet;
    std::map<std::string, Mat> featureMap;
    std::map<std::pair<std::string, std::string>, int> gtMap;

    for (std::string line, key; getline(ifs, line);)
    {
        std::string fname1, fname2;
        int label;

        std::istringstream iss(line);
        iss >> fname1 >> fname2 >> label;
        // std::cout << fname1 << " " << fname2 << " " << label << std::endl;

        fSet.insert(fname1);
        fSet.insert(fname2);
        gtMap[std::make_pair(fname1, fname2)] = label;
    }

    // Initialize detector and recognizer
    std::string detect_model = findDataFile("dnn/onnx/models/yunet-202303.onnx", false);
    Ptr<FaceDetectorYN> faceDetector = FaceDetectorYN::create(detect_model, "", Size(150, 150), score_thresh, nms_thresh);

    std::string recog_model = findDataFile("dnn/onnx/models/face_recognizer_fast.onnx", false);
    Ptr<FaceRecognizerSF> faceRecognizer = FaceRecognizerSF::create(recog_model, "");

    // Detect, align and extract a feature per image
    for (auto fname: fSet)
    {
        std::string imagePath = findDataFile("dnn_face/recognition/" + fname);
        Mat image = imread(imagePath);

        Mat faces;
        faceDetector->detect(image, faces);

        Mat aligned_face;
        faceRecognizer->alignCrop(image, faces.row(0), aligned_face);

        Mat feature;
        faceRecognizer->feature(aligned_face, feature);
        featureMap[fname] = feature.clone();
    }

    // Match feature pairs against the ground-truth labels
    for (auto item: gtMap)
    {
        Mat feature1 = featureMap[item.first.first];
        Mat feature2 = featureMap[item.first.second];
        int label = item.second;

        double cos_score = faceRecognizer->match(feature1, feature2, FaceRecognizerSF::DisType::FR_COSINE);
        double L2_score = faceRecognizer->match(feature1, feature2, FaceRecognizerSF::DisType::FR_NORM_L2);

        EXPECT_TRUE(label == 0 ? cos_score <= cosine_similar_thresh : cos_score > cosine_similar_thresh)
            << "Cosine match result of images " << item.first.first << " and " << item.first.second
            << " is different from ground truth (score: " << cos_score << "; thresh: " << cosine_similar_thresh << ").";
        EXPECT_TRUE(label == 0 ? L2_score > l2norm_similar_thresh : L2_score <= l2norm_similar_thresh)
            << "L2norm match result of images " << item.first.first << " and " << item.first.second
            << " is different from ground truth (score: " << L2_score << "; thresh: " << l2norm_similar_thresh << ").";
    }
}

}} // namespace
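// Illustrative addition (not part of the original regression suite): for
// L2-normalized embeddings, squared L2 distance and cosine similarity are
// related by ||a - b||^2 = 2 - 2 * (a . b), which is why the paired thresholds
// above are mutually consistent (1.128^2 ~= 2 - 2 * 0.363). Whether the
// recognizer's features are normalized is an assumption here; the vectors and
// the test name below are illustrative only.
namespace opencv_test { namespace {

TEST(Objdetect_face_recognition, cosine_l2norm_threshold_relation_example)
{
    // Two arbitrary unit-length 2D vectors.
    cv::Vec2d a(1.0, 0.0);
    cv::Vec2d b(std::cos(0.8), std::sin(0.8));

    double cosine = a.dot(b);        // cosine similarity of unit vectors
    double l2dist = cv::norm(a - b); // Euclidean distance
    EXPECT_NEAR(l2dist * l2dist, 2.0 - 2.0 * cosine, 1e-12);

    // The thresholds used in the regression above satisfy the same identity approximately.
    EXPECT_NEAR(1.128 * 1.128, 2.0 - 2.0 * 0.363, 2e-3);
}

}} // namespace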