// 计算 anchor box 的坐标 for (int z = 0; z < D; ++z) { for (int y = 0; y < H; ++y) { for (int x = 0; x < W; ++x) { for (int a = 0; a < anchors.size(); ++a) { windows.row(index) << oz[z], oh[y], ow[x], anchors[a][0], anchors[a][1], anchors[a][2]; ++index; } } } }

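这段代码用于生成目标检测中所有 anchor box 的坐标。其中，D、H 和 W 分别表示特征图的深度、高度和宽度；anchors 是一个包含多个 anchor box 的数组，每个 anchor box 是一个三元组（代码中依次读取 anchors[a][0]、anchors[a][1]、anchors[a][2]）。代码本身没有说明这三个值的含义；结合三维位置 (z, y, x) 来看，它们更可能是 anchor 在深度、高度、宽度三个方向上的尺寸，而不一定是宽度、高度和宽高比。这段代码通过四重循环枚举所有空间位置与 anchor box 的组合，把预先算好的中心坐标 (oz[z], oh[y], ow[x]) 和该 anchor 的三个值依次写入矩阵 windows 的第 index 行，每写完一行 index 加一，最终所有 anchor box 都存储在这个矩阵中。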

Eigen::ArrayXXd windows(D * H * W * anchors.size(), 6); //Eigen::MatrixXd windows(D * H * W * anchors.size(), 6); int index = 0; Eigen::VectorXd oz(D), oh(H), ow(W); for (int z = 0; z < D; ++z) { oz[z] = offset + z * stride; } for (int y = 0; y < H; ++y) { oh[y] = offset + y * stride; } for (int x = 0; x < W; ++x) { ow[x] = offset + x * stride; } // 计算 anchor box 的坐标 for (int z = 0; z < D; ++z) { for (int y = 0; y < H; ++y) { for (int x = 0; x < W; ++x) { for (int a = 0; a < anchors.size(); ++a) { windows.row(index) << oz[z], oh[y], ow[x], anchors[a][0], anchors[a][1], anchors[a][2]; ++index; } } } } return windows;

这段代码是目标检测中生成所有 anchor boxes 的位置和大小的函数体。首先，代码定义了一个 Eigen::ArrayXXd 类型的二维数组 windows，用于存储所有 anchor boxes 的位置和大小信息。它的行数为 D * H * W * anchors.size()，表示总共有这么多个 anchor boxes；每个 anchor box 的信息包含 6 个数值，分别是它的中心坐标 (oz, oh, ow) 和该 anchor 的三个参数 (anchors[a][0], anchors[a][1], anchors[a][2])。接下来，代码通过三个循环分别计算 D、H 和 W 三个方向上 anchor boxes 的中心坐标，计算公式为 offset + i * stride。其中，offset 是每个方向上第一个中心点的坐标，stride 是相邻两个中心点之间的步长。假设特征图的大小为 DxHxW，anchor box 的数量为 N。这三个循环彼此独立、并非嵌套，因此它们的时间复杂度为 O(D + H + W)，而不是 O(DxHxW)。最后，代码通过四重循环枚举所有可能的空间位置和 anchor box，把对应的中心坐标和 anchor 参数写入矩阵 windows 的每一行，并返回该矩阵。这四重循环的时间复杂度为 O(DxHxWxN)，其中 N 表示 anchor box 的数量。因此，该函数的总时间复杂度为 O(DxHxWxN)。

解释代码：int post_process(int8_t* input0, int8_t* input1, int8_t* input2, int model_in_h, int model_in_w, float conf_threshold, float nms_threshold, float scale_w, float scale_h, std::vector<int32_t>& qnt_zps, std::vector<float>& qnt_scales, detect_result_group_t* group) { static int init = -1; if (init == -1) { int ret = 0; ret = loadLabelName(LABEL_NALE_TXT_PATH, labels); if (ret < 0) { return -1; } init = 0; } memset(group, 0, sizeof(detect_result_group_t)); std::vector<float> filterBoxes; std::vector<float> objProbs; std::vector<int> classId; // stride 8 int stride0 = 8; int grid_h0 = model_in_h / stride0; int grid_w0 = model_in_w / stride0; int validCount0 = 0; validCount0 = process(input0, (int)anchor0, grid_h0, grid_w0, model_in_h, model_in_w, stride0, filterBoxes, objProbs, classId, conf_threshold, qnt_zps[0], qnt_scales[0]); // stride 16 int stride1 = 16; int grid_h1 = model_in_h / stride1; int grid_w1 = model_in_w / stride1; int validCount1 = 0; validCount1 = process(input1, (int)anchor1, grid_h1, grid_w1, model_in_h, model_in_w, stride1, filterBoxes, objProbs, classId, conf_threshold, qnt_zps[1], qnt_scales[1]); // stride 32 int stride2 = 32; int grid_h2 = model_in_h / stride2; int grid_w2 = model_in_w / stride2; int validCount2 = 0; validCount2 = process(input2, (int)anchor2, grid_h2, grid_w2, model_in_h, model_in_w, stride2, filterBoxes, objProbs, classId, conf_threshold, qnt_zps[2], qnt_scales[2]); int validCount = validCount0 + validCount1 + validCount2; // no object detect if (validCount <= 0) { return 0; } std::vector<int> indexArray; for (int i = 0; i < validCount; ++i) { indexArray.push_back(i); } quick_sort_indice_inverse(objProbs, 0, validCount - 1, indexArray); std::set<int> class_set(std::begin(classId), std::end(classId)); for (auto c : class_set) { nms(validCount, filterBoxes, classId, indexArray, c, nms_threshold); } int last_count = 0; group->count = 0; /* box valid detect target */ for (int i = 0; i < validCount; ++i) { if (indexArray[i] == -1 
|| last_count >= OBJ_NUMB_MAX_SIZE) { continue; } int n = indexArray[i]; float x1 = filterBoxes[n * 4 + 0]; float y1 = filterBoxes[n * 4 + 1]; float x2 = x1 + filterBoxes[n * 4 + 2]; float y2 = y1 + filterBoxes[n * 4 + 3]; int id = classId[n]; float obj_conf = objProbs[i]; group->results[last_count].box.left = (int)(clamp(x1, 0, model_in_w) / scale_w); group->results[last_count].box.top = (int)(clamp(y1, 0, model_in_h) / scale_h); group->results[last_count].box.right = (int)(clamp(x2, 0, model_in_w) / scale_w); group->results[last_count].box.bottom = (int)(clamp(y2, 0, model_in_h) / scale_h); group->results[last_count].prop = obj_conf; char* label = labels[id]; strncpy(group->results[last_count].name, label, OBJ_NAME_MAX_SIZE); // printf("result %2d: (%4d, %4d, %4d, %4d), %s\n", i, group->results[last_count].box.left, // group->results[last_count].box.top, // group->results[last_count].box.right, group->results[last_count].box.bottom, label); last_count++; } group->count = last_count; return 0; }

这段代码实现了目标检测的后处理函数，对模型输出的特征图进行处理，并生成检测结果。具体解释如下：函数参数： - `input0`、`input1`、`input2`：三个特征图的指针，分别对应 stride 为 8、16、32 的特征图。 - `model_in_h`、`model_in_w`：输入模型的高度和宽度。 - `conf_threshold`：目标置信度的阈值。 - `nms_threshold`：非极大值抑制的阈值。 - `scale_w`、`scale_h`：图像的缩放因子。 - `qnt_zps`、`qnt_scales`：量化参数。 - `group`：存储检测结果的指针。函数功能： 1. 首先，检查是否需要初始化标签名，如果是第一次调用函数，则加载标签名并保存在全局变量 `labels` 中。 2. 初始化存储检测结果的 `group` 结构体，并将其内存清零。 3. 创建用于存储过滤后的检测框位置和大小的向量 `filterBoxes`，以及存储目标置信度和类别编号的向量 `objProbs` 和 `classId`。 4. 对 stride 为 8 的特征图进行处理，计算有效目标数目，并将结果保存在 `validCount0` 中。 5. 对 stride 为 16 和 32 的特征图进行类似的处理，计算有效目标数目并分别保存在 `validCount1` 和 `validCount2` 中。 6. 计算总的有效目标数目 `validCount`，如果没有检测到目标，则直接返回。 7. 创建一个索引数组 `indexArray`，用于排序和非极大值抑制操作。 8. 使用快速排序算法 `quick_sort_indice_inverse` 对目标置信度 `objProbs` 进行降序排序，并记录索引的变化情况。 9. 创建一个集合 `class_set`，用于存储所有出现的类别编号。 10. 针对每个类别对目标框进行非极大值抑制操作，剔除重叠度较高的重复框，保留置信度最高的框。 11. 初始化最终检测结果计数器 `last_count` 和 `group->count`。 12. 遍历排序后的索引数组 `indexArray`，获取每个目标框的位置、大小、类别编号和置信度，并进行一些后处理操作。 13. 将检测结果转换为图像坐标，并保存在 `group->results` 中。 14. 更新最终检测结果计数器 `last_count`。 15. 将最终的检测结果数目保存在 `group->count` 中。 16. 返回 0 表示处理成功。通过这样的处理过程，可以从模型输出的特征图中提取出有效的目标检测结果，并进行非极大值抑制操作，最终生成包含检测框位置、大小、类别和置信度的结果。

// 计算 anchor box 的坐标 for (int z = 0; z < D; ++z) { for (int y = 0; y < H; ++y) { for (int x = 0; x < W; ++x) { for (int a = 0; a < anchors.size(); ++a) { windows.row(index) << oz[z], oh[y], ow[x], anchors[a][0], anchors[a][1], anchors[a][2]; ++index; } } } }

相关推荐

yolov3中kmeans算法生成Anchor Box脚本

在深度学习中bik-means算法、k-means算法和kmean++算法生成anchor框应用

Kmeans聚类算法获得anchor_box

用cpp写一个根据矩形锚框坐标切割深度图并输出切割后深度图尺寸的函数

用cpp写一个将输入的无序点云变为有序点云，并根据像素坐标形成的锚框进行切割的函数

用cpp写一个将xyz点云文件转为有序点云，根据输入像素坐标形成矩形锚框切割为新点云的函数

用cpp调用pcl库写一个将xyz无序点云转变为有序点云,根据输入像素坐标形成锚框切割生成新的点云的程序

目标识别中，如何使目标标注框大小不变。求Python代码

设计一个目标检测的UI界面的代码

FreeAnchor:Learning to match anchors for visual object detection论文翻译.doc

FreeAnchor:Learning to match anchors for visual object detecti翻译.pdf

基于NanoDet项目进行小裁剪，专门用来实现PyTorch 版本的python源码+文档说明

课程设计基于机器学习的Webshell中恶意函数检测源码+设计报告+样本数据.zip

JavaScript for in锚点的动态创建

A2J Anchor-to-Joint Regression Network for 3D Articulated Pose Estimation.pdf

Anchor-Intermediate Detector: object detection 目标检测组会汇报ppt

###对华为OD分布式操作系统的详细介绍

最新推荐

###对华为OD分布式操作系统的详细介绍

2110220116吴骏博.py

基于Java的ApplicationPower快速项目生成脚手架设计源码

基于MATLAB实现的OFDM经典同步算法之一Park算法仿真，附带Park算法经典文献+代码文档+使用说明文档.rar

基于MATLAB实现的imu和视觉里程计 kalman滤波器 进行融合+使用说明文档.rar

zigbee-cluster-library-specification

管理建模和仿真的文件

【实战演练】MATLAB用遗传算法改进粒子群GA-PSO算法

openstack的20种接口有哪些

JSBSim Reference Manual

基于MATLAB实现的imu和视觉里程计 kalman滤波器进行融合+使用说明文档.rar