#include "yolo11_buff.hpp" const double ConfidenceThreshold = 0.7f; const double IouThreshold = 0.4f; namespace auto_buff { YOLO11_BUFF::YOLO11_BUFF(const std::string & config) { auto yaml = YAML::LoadFile(config); std::string model_path = yaml["model"].as(); model = core.read_model(model_path); // printInputAndOutputsInfo(*model); // 打印模型信息 /// 载入并编译模型 compiled_model = core.compile_model(model, "CPU"); /// 创建推理请求 infer_request = compiled_model.create_infer_request(); // 获取模型输入节点 input_tensor = infer_request.get_input_tensor(); input_tensor.set_shape({1, 3, 640, 640}); } std::vector YOLO11_BUFF::get_multicandidateboxes(cv::Mat & image) { const int64 start = cv::getTickCount(); // 设置模型输入 /// 预处理 // const float factor = fill_tensor_data_image(input_tensor, image); // 填充图片到合适的input size if (image.empty()) { tools::logger()->warn("Empty img!, camera drop!"); return std::vector (); } cv::Mat bgr_img = image; auto x_scale = static_cast(640) / bgr_img.rows; auto y_scale = static_cast(640) / bgr_img.cols; auto scale = std::min(x_scale, y_scale); auto h = static_cast(bgr_img.rows * scale); auto w = static_cast(bgr_img.cols * scale); double factor = scale; // preproces auto input = cv::Mat(640, 640, CV_8UC3, cv::Scalar(0, 0, 0)); auto roi = cv::Rect(0, 0, w, h); cv::resize(bgr_img, input(roi), {w, h}); ov::Tensor input_tensor(ov::element::u8, {1, 640, 640, 3}, input.data); /// 执行推理计算 infer_request.infer(); /// 处理推理计算结果 const ov::Tensor output = infer_request.get_output_tensor(); // 获得推理结果 const ov::Shape output_shape = output.get_shape(); const float * output_buffer = output.data(); const int out_rows = output_shape[1]; // 获得"output"节点的rows 15 const int out_cols = output_shape[2]; // 获得"output"节点的cols 8400 const cv::Mat det_output( out_rows, out_cols, CV_32F, (float *)output_buffer); // output_buff类型转换 std::vector boxes; // 目标框 std::vector confidences; // 置信度 std::vector> objects_keypoints; // 关键点 // 输出格式是[15,8400], 每列代表一个框(即最多有8400个框), 前面4行分别是[cx, cy, ow, oh], 中间score, 最后5*2关键点(3代表每个关键点的信息, 包括[x, y, visibility],如果是2，则没有visibility) // 15 = 4 + 1 + NUM_POINTS * 2 56 for (int i = 0; i < det_output.cols; ++i) { const float score = det_output.at(4, i); // 如果置信度满足条件则放进vector if (score > ConfidenceThreshold) { // 获取目标框 const float cx = det_output.at(0, i); const float cy = det_output.at(1, i); const float ow = det_output.at(2, i); const float oh = det_output.at(3, i); cv::Rect box; box.x = static_cast((cx - 0.5 * ow) * factor); box.y = static_cast((cy - 0.5 * oh) * factor); box.width = static_cast(ow * factor); box.height = static_cast(oh * factor); boxes.push_back(box); // 获取置信度 confidences.push_back(score); // 获取关键点 std::vector keypoints; cv::Mat kpts = det_output.col(i).rowRange(NUM_POINTS, 15); for (int j = 0; j < NUM_POINTS; ++j) { const float x = kpts.at(j * 2 + 0, 0) * factor; const float y = kpts.at(j * 2 + 1, 0) * factor; // const float s = kpts.at(j * 3 + 2, 0); keypoints.push_back(x); keypoints.push_back(y); // keypoints.push_back(s); } objects_keypoints.push_back(keypoints); } } /// NMS,消除具有较低置信度的冗余重叠框,用于处理多个框的情况 std::vector indexes; cv::dnn::NMSBoxes(boxes, confidences, ConfidenceThreshold, IouThreshold, indexes); std::vector