Yolo_Pose姿态模型在arm linux的验证与部署
2026-06-03
1、下载模型转换项目rknn_model_zoo
github链接:https://github.com/airockchip/rknn_model_zoo/tree/main
2、在板子(瑞芯微)配置后对应的运行环境
- **rknn-toolkit2:**https://github.com/airockchip/rknn-toolkit2
- OpenCV
- Boost
- Eigen3
3、使用该项目下对应的后处理postprocess代码(很重要!!!)
这里是以yolo的姿态检测为例:
- 进入路径:cd /rknn_model_zoo/examples/yolov8_pose/cpp/
- 该路径下的代码都是在瑞芯微板子中运行目标姿态检测的代码
- 示例代码如下:
// 1、rknn初始化使用
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <math.h>
#include "yolov8-pose.h"
#include "common.h"
#include "file_utils.h"
#include "image_utils.h"
#include <sys/time.h>
static inline int64_t getCurrentTimeUs()
{
struct timeval tv;
gettimeofday(&tv, NULL);
return tv.tv_sec * 1000000 + tv.tv_usec;
}
static void dump_tensor_attr(rknn_tensor_attr *attr)
{
printf(" index=%d, name=%s, n_dims=%d, dims=[%d, %d, %d, %d], n_elems=%d, size=%d, fmt=%s, type=%s, qnt_type=%s, "
"zp=%d, scale=%f\n",
attr->index, attr->name, attr->n_dims, attr->dims[0], attr->dims[1], attr->dims[2], attr->dims[3],
attr->n_elems, attr->size, get_format_string(attr->fmt), get_type_string(attr->type),
get_qnt_type_string(attr->qnt_type), attr->zp, attr->scale);
}
int init_yolov8_pose_model(const char *model_path, rknn_app_context_t *app_ctx)
{
int ret;
rknn_context ctx = 0;
ret = rknn_init(&ctx, (char *)model_path, 0, 0, NULL);
if (ret < 0)
{
printf("rknn_init fail! ret=%d\n", ret);
return -1;
}
// Get Model Input Output Number
rknn_input_output_num io_num;
ret = rknn_query(ctx, RKNN_QUERY_IN_OUT_NUM, &io_num, sizeof(io_num));
if (ret != RKNN_SUCC)
{
printf("rknn_query fail! ret=%d\n", ret);
return -1;
}
printf("model input num: %d, output num: %d\n", io_num.n_input, io_num.n_output);
// Get Model Input Info
printf("input tensors:\n");
rknn_tensor_attr input_attrs[io_num.n_input];
memset(input_attrs, 0, sizeof(input_attrs));
for (int i = 0; i < io_num.n_input; i++)
{
input_attrs[i].index = i;
ret = rknn_query(ctx, RKNN_QUERY_INPUT_ATTR, &(input_attrs[i]), sizeof(rknn_tensor_attr));
if (ret != RKNN_SUCC)
{
printf("rknn_query fail! ret=%d\n", ret);
return -1;
}
dump_tensor_attr(&(input_attrs[i]));
}
// Get Model Output Info
printf("output tensors:\n");
rknn_tensor_attr output_attrs[io_num.n_output];
memset(output_attrs, 0, sizeof(output_attrs));
for (int i = 0; i < io_num.n_output; i++)
{
output_attrs[i].index = i;
ret = rknn_query(ctx, RKNN_QUERY_OUTPUT_ATTR, &(output_attrs[i]), sizeof(rknn_tensor_attr));
if (ret != RKNN_SUCC)
{
printf("rknn_query fail! ret=%d\n", ret);
return -1;
}
dump_tensor_attr(&(output_attrs[i]));
}
// Set to context
app_ctx->rknn_ctx = ctx;
// TODO
if (output_attrs[0].qnt_type == RKNN_TENSOR_QNT_AFFINE_ASYMMETRIC && output_attrs[0].type != RKNN_TENSOR_FLOAT16)
{
app_ctx->is_quant = true;
}
else
{
app_ctx->is_quant = false;
}
app_ctx->io_num = io_num;
app_ctx->input_attrs = (rknn_tensor_attr *)malloc(io_num.n_input * sizeof(rknn_tensor_attr));
memcpy(app_ctx->input_attrs, input_attrs, io_num.n_input * sizeof(rknn_tensor_attr));
app_ctx->output_attrs = (rknn_tensor_attr *)malloc(io_num.n_output * sizeof(rknn_tensor_attr));
memcpy(app_ctx->output_attrs, output_attrs, io_num.n_output * sizeof(rknn_tensor_attr));
if (input_attrs[0].fmt == RKNN_TENSOR_NCHW)
{
printf("model is NCHW input fmt\n");
app_ctx->model_channel = input_attrs[0].dims[1];
app_ctx->model_height = input_attrs[0].dims[2];
app_ctx->model_width = input_attrs[0].dims[3];
}
else
{
printf("model is NHWC input fmt\n");
app_ctx->model_height = input_attrs[0].dims[1];
app_ctx->model_width = input_attrs[0].dims[2];
app_ctx->model_channel = input_attrs[0].dims[3];
}
printf("model input height=%d, width=%d, channel=%d\n",
app_ctx->model_height, app_ctx->model_width, app_ctx->model_channel);
return 0;
}
int release_yolov8_pose_model(rknn_app_context_t *app_ctx)
{
if (app_ctx->input_attrs != NULL)
{
free(app_ctx->input_attrs);
app_ctx->input_attrs = NULL;
}
if (app_ctx->output_attrs != NULL)
{
free(app_ctx->output_attrs);
app_ctx->output_attrs = NULL;
}
if (app_ctx->rknn_ctx != 0)
{
rknn_destroy(app_ctx->rknn_ctx);
app_ctx->rknn_ctx = 0;
}
return 0;
}
int inference_yolov8_pose_model(rknn_app_context_t *app_ctx, image_buffer_t *img, object_detect_result_list *od_results)
{
int ret;
image_buffer_t dst_img;
letterbox_t letter_box;
rknn_input inputs[app_ctx->io_num.n_input];
rknn_output outputs[app_ctx->io_num.n_output];
const float nms_threshold = NMS_THRESH; // Default NMS threshold
const float box_conf_threshold = BOX_THRESH; // Default box threshold
int bg_color = 114;
if ((!app_ctx) || !(img) || (!od_results))
{
return -1;
}
memset(od_results, 0x00, sizeof(*od_results));
memset(&letter_box, 0, sizeof(letterbox_t));
memset(&dst_img, 0, sizeof(image_buffer_t));
memset(inputs, 0, sizeof(inputs));
memset(outputs, 0, sizeof(outputs));
// Pre Process
dst_img.width = app_ctx->model_width;
dst_img.height = app_ctx->model_height;
dst_img.format = IMAGE_FORMAT_RGB888;
dst_img.size = get_image_size(&dst_img);
dst_img.virt_addr = (unsigned char *)malloc(dst_img.size);
if (dst_img.virt_addr == NULL)
{
printf("malloc buffer size:%d fail!\n", dst_img.size);
goto out;
}
// letterbox
ret = convert_image_with_letterbox(img, &dst_img, &letter_box, bg_color);
if (ret < 0)
{
printf("convert_image_with_letterbox fail! ret=%d\n", ret);
goto out;
}
// Set Input Data
inputs[0].index = 0;
inputs[0].type = RKNN_TENSOR_UINT8;
inputs[0].fmt = RKNN_TENSOR_NHWC;
inputs[0].size = app_ctx->model_width * app_ctx->model_height * app_ctx->model_channel;
inputs[0].buf = dst_img.virt_addr;
ret = rknn_inputs_set(app_ctx->rknn_ctx, app_ctx->io_num.n_input, inputs);
if (ret < 0)
{
printf("rknn_input_set fail! ret=%d\n", ret);
goto out;
}
// Run
printf("rknn_run\n");
int start_us,end_us;
start_us = getCurrentTimeUs();
ret = rknn_run(app_ctx->rknn_ctx, nullptr);
end_us = getCurrentTimeUs() - start_us;
printf("rknn_run time=%.2fms, FPS = %.2f\n",end_us / 1000.f,
1000.f * 1000.f / end_us);
if (ret < 0)
{
printf("rknn_run fail! ret=%d\n", ret);
goto out;
}
// Get Output
memset(outputs, 0, sizeof(outputs));
for (int i = 0; i < app_ctx->io_num.n_output; i++)
{
outputs[i].index = i;
outputs[i].want_float = (!app_ctx->is_quant);
}
ret = rknn_outputs_get(app_ctx->rknn_ctx, app_ctx->io_num.n_output, outputs, NULL);
if (ret < 0)
{
printf("rknn_outputs_get fail! ret=%d\n", ret);
goto out;
}
// Post Process
start_us = getCurrentTimeUs();
post_process(app_ctx, outputs, &letter_box, box_conf_threshold, nms_threshold, od_results);
end_us = getCurrentTimeUs() - start_us;
printf("post_process time=%.2fms, FPS = %.2f\n",end_us / 1000.f,
1000.f * 1000.f / end_us);
// Remeber to release rknn output
rknn_outputs_release(app_ctx->rknn_ctx, app_ctx->io_num.n_output, outputs);
out:
if (dst_img.virt_addr != NULL)
{
free(dst_img.virt_addr);
}
return ret;
}
// 2、核心后处理代码(适配rk3588的代码,也就是RKNPU2)
#include "yolov8-pose.h"
#include <math.h>
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <sys/time.h>
#include "Float16.h"
#include <set>
#include <vector>
#define LABEL_NALE_TXT_PATH "/home/app/bin/yolov8_pose_labels_list.txt"
static char *labels[OBJ_CLASS_NUM];
inline static int clamp(float val, int min, int max) { return val > min ? (val < max ? val : max) : min; }
static char *readLine(FILE *fp, char *buffer, int *len) {
int ch;
int i = 0;
size_t buff_len = 0;
buffer = (char *)malloc(buff_len + 1);
if (!buffer)
return NULL; // Out of memory
while ((ch = fgetc(fp)) != '\n' && ch != EOF) {
buff_len++;
void *tmp = realloc(buffer, buff_len + 1);
if (tmp == NULL) {
free(buffer);
return NULL; // Out of memory
}
buffer = (char *)tmp;
buffer[i] = (char)ch;
i++;
}
buffer[i] = '\0';
*len = buff_len;
// Detect end
if (ch == EOF && (i == 0 || ferror(fp))) {
free(buffer);
return NULL;
}
return buffer;
}
static int readLines(const char *fileName, char *lines[], int max_line) {
FILE *file = fopen(fileName, "r");
char *s;
int i = 0;
int n = 0;
if (file == NULL) {
printf("Open %s fail!\n", fileName);
return -1;
}
while ((s = readLine(file, s, &n)) != NULL) {
lines[i++] = s;
if (i >= max_line)
break;
}
fclose(file);
return i;
}
static int loadLabelName(const char *locationFilename, char *label[]) {
printf("load lable %s\n", locationFilename);
readLines(locationFilename, label, OBJ_CLASS_NUM);
return 0;
}
static float CalculateOverlap(float xmin0, float ymin0, float xmax0, float ymax0, float xmin1, float ymin1, float xmax1,
float ymax1)
{
float w = fmax(0.f, fmin(xmax0, xmax1) - fmax(xmin0, xmin1) + 1.0);
float h = fmax(0.f, fmin(ymax0, ymax1) - fmax(ymin0, ymin1) + 1.0);
float i = w * h;
float u = (xmax0 - xmin0 + 1.0) * (ymax0 - ymin0 + 1.0) + (xmax1 - xmin1 + 1.0) * (ymax1 - ymin1 + 1.0) - i;
return u <= 0.f ? 0.f : (i / u);
}
static int nms(int validCount, std::vector<float> &outputLocations, std::vector<int> classIds, std::vector<int> &order,
int filterId, float threshold)
{
for (int i = 0; i < validCount; ++i)
{
int n = order[i];
if (n == -1 || classIds[n] != filterId)
{
continue;
}
for (int j = i + 1; j < validCount; ++j)
{
int m = order[j];
if (m == -1 || classIds[m] != filterId)
{
continue;
}
float xmin0 = outputLocations[n * 5 + 0];
float ymin0 = outputLocations[n * 5 + 1];
float xmax0 = outputLocations[n * 5 + 0] + outputLocations[n * 5 + 2];
float ymax0 = outputLocations[n * 5 + 1] + outputLocations[n * 5 + 3];
float xmin1 = outputLocations[m * 5 + 0];
float ymin1 = outputLocations[m * 5 + 1];
float xmax1 = outputLocations[m * 5 + 0] + outputLocations[m * 5 + 2];
float ymax1 = outputLocations[m * 5 + 1] + outputLocations[m * 5 + 3];
float iou = CalculateOverlap(xmin0, ymin0, xmax0, ymax0, xmin1, ymin1, xmax1, ymax1);
if (iou > threshold)
{
order[j] = -1;
}
}
}
return 0;
}
static int quick_sort_indice_inverse(std::vector<float> &input, int left, int right, std::vector<int> &indices) {
float key;
int key_index;
int low = left;
int high = right;
if (left < right) {
key_index = indices[left];
key = input[left];
while (low < high) {
while (low < high && input[high] <= key) {
high--;
}
input[low] = input[high];
indices[low] = indices[high];
while (low < high && input[low] >= key) {
low++;
}
input[high] = input[low];
indices[high] = indices[low];
}
input[low] = key;
indices[low] = key_index;
quick_sort_indice_inverse(input, left, low - 1, indices);
quick_sort_indice_inverse(input, low + 1, right, indices);
}
return low;
}
static float sigmoid(float x) {
return 1.0 / (1.0 + expf(-x));
}
static float unsigmoid(float y) {
return -1.0 * logf((1.0 / y) - 1.0);
}
inline static int32_t __clip(float val, float min, float max) {
float f = val <= min ? min : (val >= max ? max : val);
return f;
}
static int8_t qnt_f32_to_affine(float f32, int32_t zp, float scale) {
float dst_val = (f32 / scale) + zp;
int8_t res = (int8_t)__clip(dst_val, -128, 127);
return res;
}
static uint8_t qnt_f32_to_affine_u8(float f32, int32_t zp, float scale) {
float dst_val = (f32 / scale) + zp;
uint8_t res = (uint8_t)__clip(dst_val, 0, 255);
return res;
}
static float deqnt_affine_to_f32(int8_t qnt, int32_t zp, float scale) {
return ((float)qnt - (float)zp) * scale;
}
static float deqnt_affine_u8_to_f32(uint8_t qnt, int32_t zp, float scale) {
return ((float)qnt - (float)zp) * scale;
}
void softmax(float *input, int size) {
float max_val = input[0];
for (int i = 1; i < size; ++i) {
if (input[i] > max_val) {
max_val = input[i];
}
}
float sum_exp = 0.0;
for (int i = 0; i < size; ++i) {
sum_exp += expf(input[i] - max_val);
}
for (int i = 0; i < size; ++i) {
input[i] = expf(input[i] - max_val) / sum_exp;
}
}
static int process_i8(int8_t *input, int grid_h, int grid_w, int stride,
std::vector<float> &boxes, std::vector<float> &boxScores, std::vector<int> &classId, float threshold,
int32_t zp, float scale, int index) {
int input_loc_len = 64;
int tensor_len = input_loc_len + OBJ_CLASS_NUM;
int validCount = 0;
int8_t thres_i8 = qnt_f32_to_affine(unsigmoid(threshold), zp, scale);
for (int h = 0; h < grid_h; h++) {
for (int w = 0; w < grid_w; w++) {
for (int a = 0; a < OBJ_CLASS_NUM; a++) {
if(input[(input_loc_len + a)*grid_w * grid_h + h * grid_w + w ] >= thres_i8) { //[1,tensor_len,grid_h,grid_w]
float box_conf_f32 = sigmoid(deqnt_affine_to_f32(input[(input_loc_len + a) * grid_w * grid_h + h * grid_w + w ],
zp, scale));
float loc[input_loc_len];
for (int i = 0; i < input_loc_len; ++i) {
loc[i] = deqnt_affine_to_f32(input[i * grid_w * grid_h + h * grid_w + w], zp, scale);
}
for (int i = 0; i < input_loc_len / 16; ++i) {
softmax(&loc[i * 16], 16);
}
float xywh_[4] = {0, 0, 0, 0};
float xywh[4] = {0, 0, 0, 0};
for (int dfl = 0; dfl < 16; ++dfl) {
xywh_[0] += loc[dfl] * dfl;
xywh_[1] += loc[1 * 16 + dfl] * dfl;
xywh_[2] += loc[2 * 16 + dfl] * dfl;
xywh_[3] += loc[3 * 16 + dfl] * dfl;
}
xywh_[0]=(w+0.5)-xywh_[0];
xywh_[1]=(h+0.5)-xywh_[1];
xywh_[2]=(w+0.5)+xywh_[2];
xywh_[3]=(h+0.5)+xywh_[3];
xywh[0]=((xywh_[0]+xywh_[2])/2)*stride;
xywh[1]=((xywh_[1]+xywh_[3])/2)*stride;
xywh[2]=(xywh_[2]-xywh_[0])*stride;
xywh[3]=(xywh_[3]-xywh_[1])*stride;
xywh[0]=xywh[0]-xywh[2]/2;
xywh[1]=xywh[1]-xywh[3]/2;
boxes.push_back(xywh[0]);//x
boxes.push_back(xywh[1]);//y
boxes.push_back(xywh[2]);//w
boxes.push_back(xywh[3]);//h
boxes.push_back(float(index + (h * grid_w) + w));//keypoints index
boxScores.push_back(box_conf_f32);
classId.push_back(a);
validCount++;
}
}
}
}
return validCount;
}
static int process_u8(uint8_t *input, int grid_h, int grid_w, int stride,
std::vector<float> &boxes, std::vector<float> &boxScores, std::vector<int> &classId, float threshold,
int32_t zp, float scale, int index) {
int input_loc_len = 64;
int tensor_len = input_loc_len + OBJ_CLASS_NUM;
int validCount = 0;
uint8_t thres_i8 = qnt_f32_to_affine_u8(unsigmoid(threshold), zp, scale);
for (int h = 0; h < grid_h; h++) {
for (int w = 0; w < grid_w; w++) {
for (int a = 0; a < OBJ_CLASS_NUM; a++) {
if(input[(input_loc_len + a)*grid_w * grid_h + h * grid_w + w ] >= thres_i8) { //[1,tensor_len,grid_h,grid_w]
float box_conf_f32 = sigmoid(deqnt_affine_u8_to_f32(input[(input_loc_len + a) * grid_w * grid_h + h * grid_w + w ],
zp, scale));
float loc[input_loc_len];
for (int i = 0; i < input_loc_len; ++i) {
loc[i] = deqnt_affine_u8_to_f32(input[i * grid_w * grid_h + h * grid_w + w], zp, scale);
}
for (int i = 0; i < input_loc_len / 16; ++i) {
softmax(&loc[i * 16], 16);
}
float xywh_[4] = {0, 0, 0, 0};
float xywh[4] = {0, 0, 0, 0};
for (int dfl = 0; dfl < 16; ++dfl) {
xywh_[0] += loc[dfl] * dfl;
xywh_[1] += loc[1 * 16 + dfl] * dfl;
xywh_[2] += loc[2 * 16 + dfl] * dfl;
xywh_[3] += loc[3 * 16 + dfl] * dfl;
}
xywh_[0]=(w+0.5)-xywh_[0];
xywh_[1]=(h+0.5)-xywh_[1];
xywh_[2]=(w+0.5)+xywh_[2];
xywh_[3]=(h+0.5)+xywh_[3];
xywh[0]=((xywh_[0]+xywh_[2])/2)*stride;
xywh[1]=((xywh_[1]+xywh_[3])/2)*stride;
xywh[2]=(xywh_[2]-xywh_[0])*stride;
xywh[3]=(xywh_[3]-xywh_[1])*stride;
xywh[0]=xywh[0]-xywh[2]/2;
xywh[1]=xywh[1]-xywh[3]/2;
boxes.push_back(xywh[0]);//x
boxes.push_back(xywh[1]);//y
boxes.push_back(xywh[2]);//w
boxes.push_back(xywh[3]);//h
boxes.push_back(float(index + (h * grid_w) + w));//keypoints index
boxScores.push_back(box_conf_f32);
classId.push_back(a);
validCount++;
}
}
}
}
return validCount;
}
static int process_fp32(float *input, int grid_h, int grid_w, int stride,
std::vector<float> &boxes, std::vector<float> &boxScores, std::vector<int> &classId, float threshold,
int32_t zp, float scale, int index) {
int input_loc_len = 64;
int tensor_len = input_loc_len + OBJ_CLASS_NUM;
int validCount = 0;
float thres_fp = unsigmoid(threshold);
for (int h = 0; h < grid_h; h++) {
for (int w = 0; w < grid_w; w++) {
for (int a = 0; a < OBJ_CLASS_NUM; a++) {
if(input[(input_loc_len + a)*grid_w * grid_h + h * grid_w + w ] >= thres_fp) { //[1,tensor_len,grid_h,grid_w]
float box_conf_f32 = sigmoid(input[(input_loc_len + a) * grid_w * grid_h + h * grid_w + w ]);
float loc[input_loc_len];
for (int i = 0; i < input_loc_len; ++i) {
loc[i] = input[i * grid_w * grid_h + h * grid_w + w];
}
for (int i = 0; i < input_loc_len / 16; ++i) {
softmax(&loc[i * 16], 16);
}
float xywh_[4] = {0, 0, 0, 0};
float xywh[4] = {0, 0, 0, 0};
for (int dfl = 0; dfl < 16; ++dfl) {
xywh_[0] += loc[dfl] * dfl;
xywh_[1] += loc[1 * 16 + dfl] * dfl;
xywh_[2] += loc[2 * 16 + dfl] * dfl;
xywh_[3] += loc[3 * 16 + dfl] * dfl;
}
xywh_[0]=(w+0.5)-xywh_[0];
xywh_[1]=(h+0.5)-xywh_[1];
xywh_[2]=(w+0.5)+xywh_[2];
xywh_[3]=(h+0.5)+xywh_[3];
xywh[0]=((xywh_[0]+xywh_[2])/2)*stride;
xywh[1]=((xywh_[1]+xywh_[3])/2)*stride;
xywh[2]=(xywh_[2]-xywh_[0])*stride;
xywh[3]=(xywh_[3]-xywh_[1])*stride;
xywh[0]=xywh[0]-xywh[2]/2;
xywh[1]=xywh[1]-xywh[3]/2;
boxes.push_back(xywh[0]);//x
boxes.push_back(xywh[1]);//y
boxes.push_back(xywh[2]);//w
boxes.push_back(xywh[3]);//h
boxes.push_back(float(index + (h * grid_w) + w));//keypoints index
boxScores.push_back(box_conf_f32);
classId.push_back(a);
validCount++;
}
}
}
}
return validCount;
}
int post_process(rknn_app_context_t *app_ctx, rknn_output *outputs, letterbox_t *letter_box, float conf_threshold, float nms_threshold, object_detect_result_list *od_results)
{
std::vector<float> filterBoxes;
std::vector<float> objProbs;
std::vector<int> classId;
int validCount = 0;
int stride = 0;
int grid_h = 0;
int grid_w = 0;
int model_in_w = app_ctx->model_width;
int model_in_h = app_ctx->model_height;
memset(od_results, 0, sizeof(object_detect_result_list));
int index = 0;
// 处理三个输出层
for (int i = 0; i < 3; i++) {
grid_h = app_ctx->output_attrs[i].dims[2];
grid_w = app_ctx->output_attrs[i].dims[3];
stride = model_in_h / grid_h;
if (app_ctx->is_quant) {
validCount += process_i8((int8_t *)outputs[i].buf, grid_h, grid_w, stride, filterBoxes, objProbs,
classId, conf_threshold, app_ctx->output_attrs[i].zp, app_ctx->output_attrs[i].scale,index);
}
else
{
validCount += process_fp32((float *)outputs[i].buf, grid_h, grid_w, stride, filterBoxes, objProbs,
classId, conf_threshold, app_ctx->output_attrs[i].zp, app_ctx->output_attrs[i].scale, index);
}
index += grid_h * grid_w;
}
// no object detect
if (validCount <= 0) {
return 0;
}
std::vector<int> indexArray;
for (int i = 0; i < validCount; ++i) {
indexArray.push_back(i);
}
quick_sort_indice_inverse(objProbs, 0, validCount - 1, indexArray);
std::set<int> class_set(std::begin(classId), std::end(classId));
for (auto c : class_set) {
nms(validCount, filterBoxes, classId, indexArray, c, nms_threshold);
}
int last_count = 0;
od_results->count = 0;
/* box valid detect target */
for (int i = 0; i < validCount; ++i) {
if (indexArray[i] == -1 || last_count >= OBJ_NUMB_MAX_SIZE) {
continue;
}
int n = indexArray[i];
float x1 = filterBoxes[n * 5 + 0] - letter_box->x_pad;
float y1 = filterBoxes[n * 5 + 1] - letter_box->y_pad;
float w = filterBoxes[n * 5 + 2];
float h = filterBoxes[n * 5 + 3];
// if (n * 5 + 4 >= filterBoxes.size()) {
// fprintf(stderr, "filterBoxes access out of bound\n");
// return -1;
// }
int keypoints_index = (int)filterBoxes[n * 5 + 4];
// if (outputs[3].buf == nullptr) {
// fprintf(stderr, "Error: outputs[3] is not available or buffer is NULL\n");
// return -1;
// }
for (int j = 0; j < 17; ++j) {
// if (outputs[i].buf == nullptr) {
// fprintf(stderr, "Error: outputs[%d].buf is NULL\n", i);
// return -1;
// }
if (app_ctx->is_quant) {
od_results->results[last_count].keypoints[j][0] = ((float)((rknpu2::float16 *)outputs[3].buf)[j*3*8400+0*8400+keypoints_index]
- letter_box->x_pad)/ letter_box->scale;
od_results->results[last_count].keypoints[j][1] = ((float)((rknpu2::float16 *)outputs[3].buf)[j*3*8400+1*8400+keypoints_index]
- letter_box->y_pad)/ letter_box->scale;
od_results->results[last_count].keypoints[j][2] = (float)((rknpu2::float16 *)outputs[3].buf)[j*3*8400+2*8400+keypoints_index];
}
else
{
od_results->results[last_count].keypoints[j][0] = (((float *)outputs[3].buf)[j*3*8400+0*8400+keypoints_index]
- letter_box->x_pad)/ letter_box->scale;
od_results->results[last_count].keypoints[j][1] = (((float *)outputs[3].buf)[j*3*8400+1*8400+keypoints_index]
- letter_box->y_pad)/ letter_box->scale;
od_results->results[last_count].keypoints[j][2] = ((float *)outputs[3].buf)[j*3*8400+2*8400+keypoints_index];
}
}
int id = classId[n];
float obj_conf = objProbs[i];
od_results->results[last_count].box.left = (int)(clamp(x1, 0, model_in_w) / letter_box->scale);
od_results->results[last_count].box.top = (int)(clamp(y1, 0, model_in_h) / letter_box->scale);
od_results->results[last_count].box.right = (int)(clamp(x1+w, 0, model_in_w) / letter_box->scale);
od_results->results[last_count].box.bottom = (int)(clamp(y1+h, 0, model_in_h) / letter_box->scale);
// od_results->results[last_count].box.angle = angle;
od_results->results[last_count].prop = obj_conf;
od_results->results[last_count].cls_id = id;
last_count++;
}
od_results->count = last_count;
return 0;
}
int init_post_process() {
int ret = 0;
ret = loadLabelName(LABEL_NALE_TXT_PATH, labels);
if (ret < 0) {
printf("Load %s failed!\n", LABEL_NALE_TXT_PATH);
return -1;
}
return 0;
}
char *coco_cls_to_name(int cls_id) {
if (cls_id >= OBJ_CLASS_NUM) {
return "null";
}
if (labels[cls_id]) {
return labels[cls_id];
}
return "null";
}
void deinit_post_process() {
for (int i = 0; i < OBJ_CLASS_NUM; i++) {
if (labels[i] != nullptr) {
free(labels[i]);
labels[i] = nullptr;
}
}
}