Yolo_Pose姿态模型在arm linux的验证与部署
2802 字
14 分钟
Yolo_Pose姿态模型在arm linux的验证与部署
1、下载模型转换项目rknn_model_zoo
github链接:https://github.com/airockchip/rknn_model_zoo/tree/main
2、在板子(瑞芯微)配置后对应的运行环境
- **rknn-toolkit2:**https://github.com/airockchip/rknn-toolkit2
- OpenCV
- Boost
- Eigen3
3、使用该项目下对应的后处理postprocess代码(很重要!!!)
这里是以yolo的姿态检测为例:
- 进入路径
/rknn_model_zoo/examples/yolov8_pose/cpp/ - 该路径下的代码都是在瑞芯微板子中运行目标姿态检测的代码
- 示例代码如下:
// 1、rknn初始化使用#include <stdio.h>#include <stdlib.h>#include <string.h>#include <math.h>
#include "yolov8-pose.h"#include "common.h"#include "file_utils.h"#include "image_utils.h"
#include <sys/time.h>
static inline int64_t getCurrentTimeUs(){ struct timeval tv; gettimeofday(&tv, NULL); return tv.tv_sec * 1000000 + tv.tv_usec;}
static void dump_tensor_attr(rknn_tensor_attr *attr){ printf(" index=%d, name=%s, n_dims=%d, dims=[%d, %d, %d, %d], n_elems=%d, size=%d, fmt=%s, type=%s, qnt_type=%s, " "zp=%d, scale=%f\n", attr->index, attr->name, attr->n_dims, attr->dims[0], attr->dims[1], attr->dims[2], attr->dims[3], attr->n_elems, attr->size, get_format_string(attr->fmt), get_type_string(attr->type), get_qnt_type_string(attr->qnt_type), attr->zp, attr->scale);}
int init_yolov8_pose_model(const char *model_path, rknn_app_context_t *app_ctx){ int ret; rknn_context ctx = 0;
ret = rknn_init(&ctx, (char *)model_path, 0, 0, NULL); if (ret < 0) { printf("rknn_init fail! ret=%d\n", ret); return -1; }
// Get Model Input Output Number rknn_input_output_num io_num; ret = rknn_query(ctx, RKNN_QUERY_IN_OUT_NUM, &io_num, sizeof(io_num)); if (ret != RKNN_SUCC) { printf("rknn_query fail! ret=%d\n", ret); return -1; } printf("model input num: %d, output num: %d\n", io_num.n_input, io_num.n_output);
// Get Model Input Info printf("input tensors:\n"); rknn_tensor_attr input_attrs[io_num.n_input]; memset(input_attrs, 0, sizeof(input_attrs)); for (int i = 0; i < io_num.n_input; i++) { input_attrs[i].index = i; ret = rknn_query(ctx, RKNN_QUERY_INPUT_ATTR, &(input_attrs[i]), sizeof(rknn_tensor_attr)); if (ret != RKNN_SUCC) { printf("rknn_query fail! ret=%d\n", ret); return -1; } dump_tensor_attr(&(input_attrs[i])); }
// Get Model Output Info printf("output tensors:\n"); rknn_tensor_attr output_attrs[io_num.n_output]; memset(output_attrs, 0, sizeof(output_attrs)); for (int i = 0; i < io_num.n_output; i++) { output_attrs[i].index = i; ret = rknn_query(ctx, RKNN_QUERY_OUTPUT_ATTR, &(output_attrs[i]), sizeof(rknn_tensor_attr)); if (ret != RKNN_SUCC) { printf("rknn_query fail! ret=%d\n", ret); return -1; } dump_tensor_attr(&(output_attrs[i])); }
// Set to context app_ctx->rknn_ctx = ctx;
// TODO if (output_attrs[0].qnt_type == RKNN_TENSOR_QNT_AFFINE_ASYMMETRIC && output_attrs[0].type != RKNN_TENSOR_FLOAT16) { app_ctx->is_quant = true; } else { app_ctx->is_quant = false; }
app_ctx->io_num = io_num; app_ctx->input_attrs = (rknn_tensor_attr *)malloc(io_num.n_input * sizeof(rknn_tensor_attr)); memcpy(app_ctx->input_attrs, input_attrs, io_num.n_input * sizeof(rknn_tensor_attr)); app_ctx->output_attrs = (rknn_tensor_attr *)malloc(io_num.n_output * sizeof(rknn_tensor_attr)); memcpy(app_ctx->output_attrs, output_attrs, io_num.n_output * sizeof(rknn_tensor_attr));
if (input_attrs[0].fmt == RKNN_TENSOR_NCHW) { printf("model is NCHW input fmt\n"); app_ctx->model_channel = input_attrs[0].dims[1]; app_ctx->model_height = input_attrs[0].dims[2]; app_ctx->model_width = input_attrs[0].dims[3]; } else { printf("model is NHWC input fmt\n"); app_ctx->model_height = input_attrs[0].dims[1]; app_ctx->model_width = input_attrs[0].dims[2]; app_ctx->model_channel = input_attrs[0].dims[3]; } printf("model input height=%d, width=%d, channel=%d\n", app_ctx->model_height, app_ctx->model_width, app_ctx->model_channel);
return 0;}
int release_yolov8_pose_model(rknn_app_context_t *app_ctx){ if (app_ctx->input_attrs != NULL) { free(app_ctx->input_attrs); app_ctx->input_attrs = NULL; } if (app_ctx->output_attrs != NULL) { free(app_ctx->output_attrs); app_ctx->output_attrs = NULL; } if (app_ctx->rknn_ctx != 0) { rknn_destroy(app_ctx->rknn_ctx); app_ctx->rknn_ctx = 0; } return 0;}
int inference_yolov8_pose_model(rknn_app_context_t *app_ctx, image_buffer_t *img, object_detect_result_list *od_results){ int ret; image_buffer_t dst_img; letterbox_t letter_box; rknn_input inputs[app_ctx->io_num.n_input]; rknn_output outputs[app_ctx->io_num.n_output]; const float nms_threshold = NMS_THRESH; // Default NMS threshold const float box_conf_threshold = BOX_THRESH; // Default box threshold int bg_color = 114;
if ((!app_ctx) || !(img) || (!od_results)) { return -1; }
memset(od_results, 0x00, sizeof(*od_results)); memset(&letter_box, 0, sizeof(letterbox_t)); memset(&dst_img, 0, sizeof(image_buffer_t)); memset(inputs, 0, sizeof(inputs)); memset(outputs, 0, sizeof(outputs));
// Pre Process dst_img.width = app_ctx->model_width; dst_img.height = app_ctx->model_height; dst_img.format = IMAGE_FORMAT_RGB888; dst_img.size = get_image_size(&dst_img); dst_img.virt_addr = (unsigned char *)malloc(dst_img.size); if (dst_img.virt_addr == NULL) { printf("malloc buffer size:%d fail!\n", dst_img.size); goto out; }
// letterbox ret = convert_image_with_letterbox(img, &dst_img, &letter_box, bg_color); if (ret < 0) { printf("convert_image_with_letterbox fail! ret=%d\n", ret); goto out; } // Set Input Data inputs[0].index = 0; inputs[0].type = RKNN_TENSOR_UINT8; inputs[0].fmt = RKNN_TENSOR_NHWC; inputs[0].size = app_ctx->model_width * app_ctx->model_height * app_ctx->model_channel; inputs[0].buf = dst_img.virt_addr;
ret = rknn_inputs_set(app_ctx->rknn_ctx, app_ctx->io_num.n_input, inputs); if (ret < 0) { printf("rknn_input_set fail! ret=%d\n", ret); goto out; }
// Run printf("rknn_run\n"); int start_us,end_us; start_us = getCurrentTimeUs(); ret = rknn_run(app_ctx->rknn_ctx, nullptr); end_us = getCurrentTimeUs() - start_us; printf("rknn_run time=%.2fms, FPS = %.2f\n",end_us / 1000.f, 1000.f * 1000.f / end_us);
if (ret < 0) { printf("rknn_run fail! ret=%d\n", ret); goto out; }
// Get Output memset(outputs, 0, sizeof(outputs)); for (int i = 0; i < app_ctx->io_num.n_output; i++) { outputs[i].index = i; outputs[i].want_float = (!app_ctx->is_quant); } ret = rknn_outputs_get(app_ctx->rknn_ctx, app_ctx->io_num.n_output, outputs, NULL); if (ret < 0) { printf("rknn_outputs_get fail! ret=%d\n", ret); goto out; } // Post Process start_us = getCurrentTimeUs(); post_process(app_ctx, outputs, &letter_box, box_conf_threshold, nms_threshold, od_results); end_us = getCurrentTimeUs() - start_us; printf("post_process time=%.2fms, FPS = %.2f\n",end_us / 1000.f, 1000.f * 1000.f / end_us); // Remeber to release rknn output rknn_outputs_release(app_ctx->rknn_ctx, app_ctx->io_num.n_output, outputs);
out: if (dst_img.virt_addr != NULL) { free(dst_img.virt_addr); }
return ret;}
// 2、核心后处理代码(适配rk3588的代码,也就是RKNPU2)#include "yolov8-pose.h"#include <math.h>#include <stdint.h>#include <stdio.h>#include <stdlib.h>#include <string.h>#include <sys/time.h>
#include "Float16.h"
#include <set>#include <vector>#define LABEL_NALE_TXT_PATH "/home/app/bin/yolov8_pose_labels_list.txt"
static char *labels[OBJ_CLASS_NUM];
inline static int clamp(float val, int min, int max) { return val > min ? (val < max ? val : max) : min; }
static char *readLine(FILE *fp, char *buffer, int *len) { int ch; int i = 0; size_t buff_len = 0;
buffer = (char *)malloc(buff_len + 1); if (!buffer) return NULL; // Out of memory
while ((ch = fgetc(fp)) != '\n' && ch != EOF) { buff_len++; void *tmp = realloc(buffer, buff_len + 1); if (tmp == NULL) { free(buffer); return NULL; // Out of memory } buffer = (char *)tmp;
buffer[i] = (char)ch; i++; } buffer[i] = '\0';
*len = buff_len;
// Detect end if (ch == EOF && (i == 0 || ferror(fp))) { free(buffer); return NULL; } return buffer;}
static int readLines(const char *fileName, char *lines[], int max_line) { FILE *file = fopen(fileName, "r"); char *s; int i = 0; int n = 0;
if (file == NULL) { printf("Open %s fail!\n", fileName); return -1; }
while ((s = readLine(file, s, &n)) != NULL) { lines[i++] = s; if (i >= max_line) break; } fclose(file); return i;}
static int loadLabelName(const char *locationFilename, char *label[]) { printf("load lable %s\n", locationFilename); readLines(locationFilename, label, OBJ_CLASS_NUM); return 0;}
static float CalculateOverlap(float xmin0, float ymin0, float xmax0, float ymax0, float xmin1, float ymin1, float xmax1, float ymax1){ float w = fmax(0.f, fmin(xmax0, xmax1) - fmax(xmin0, xmin1) + 1.0); float h = fmax(0.f, fmin(ymax0, ymax1) - fmax(ymin0, ymin1) + 1.0); float i = w * h; float u = (xmax0 - xmin0 + 1.0) * (ymax0 - ymin0 + 1.0) + (xmax1 - xmin1 + 1.0) * (ymax1 - ymin1 + 1.0) - i; return u <= 0.f ? 0.f : (i / u);}
static int nms(int validCount, std::vector<float> &outputLocations, std::vector<int> classIds, std::vector<int> &order, int filterId, float threshold){ for (int i = 0; i < validCount; ++i) { int n = order[i]; if (n == -1 || classIds[n] != filterId) { continue; } for (int j = i + 1; j < validCount; ++j) { int m = order[j]; if (m == -1 || classIds[m] != filterId) { continue; } float xmin0 = outputLocations[n * 5 + 0]; float ymin0 = outputLocations[n * 5 + 1]; float xmax0 = outputLocations[n * 5 + 0] + outputLocations[n * 5 + 2]; float ymax0 = outputLocations[n * 5 + 1] + outputLocations[n * 5 + 3];
float xmin1 = outputLocations[m * 5 + 0]; float ymin1 = outputLocations[m * 5 + 1]; float xmax1 = outputLocations[m * 5 + 0] + outputLocations[m * 5 + 2]; float ymax1 = outputLocations[m * 5 + 1] + outputLocations[m * 5 + 3];
float iou = CalculateOverlap(xmin0, ymin0, xmax0, ymax0, xmin1, ymin1, xmax1, ymax1);
if (iou > threshold) { order[j] = -1; } } } return 0;}
static int quick_sort_indice_inverse(std::vector<float> &input, int left, int right, std::vector<int> &indices) { float key; int key_index; int low = left; int high = right; if (left < right) { key_index = indices[left]; key = input[left]; while (low < high) { while (low < high && input[high] <= key) { high--; } input[low] = input[high]; indices[low] = indices[high]; while (low < high && input[low] >= key) { low++; } input[high] = input[low]; indices[high] = indices[low]; } input[low] = key; indices[low] = key_index; quick_sort_indice_inverse(input, left, low - 1, indices); quick_sort_indice_inverse(input, low + 1, right, indices); } return low;}
static float sigmoid(float x) { return 1.0 / (1.0 + expf(-x));}
static float unsigmoid(float y) { return -1.0 * logf((1.0 / y) - 1.0);}
inline static int32_t __clip(float val, float min, float max) { float f = val <= min ? min : (val >= max ? max : val); return f;}
static int8_t qnt_f32_to_affine(float f32, int32_t zp, float scale) { float dst_val = (f32 / scale) + zp; int8_t res = (int8_t)__clip(dst_val, -128, 127); return res;}
static uint8_t qnt_f32_to_affine_u8(float f32, int32_t zp, float scale) { float dst_val = (f32 / scale) + zp; uint8_t res = (uint8_t)__clip(dst_val, 0, 255); return res;}
static float deqnt_affine_to_f32(int8_t qnt, int32_t zp, float scale) { return ((float)qnt - (float)zp) * scale;}static float deqnt_affine_u8_to_f32(uint8_t qnt, int32_t zp, float scale) { return ((float)qnt - (float)zp) * scale;}
void softmax(float *input, int size) { float max_val = input[0]; for (int i = 1; i < size; ++i) { if (input[i] > max_val) { max_val = input[i]; } }
float sum_exp = 0.0; for (int i = 0; i < size; ++i) { sum_exp += expf(input[i] - max_val); }
for (int i = 0; i < size; ++i) { input[i] = expf(input[i] - max_val) / sum_exp; }}
static int process_i8(int8_t *input, int grid_h, int grid_w, int stride, std::vector<float> &boxes, std::vector<float> &boxScores, std::vector<int> &classId, float threshold, int32_t zp, float scale, int index) { int input_loc_len = 64; int tensor_len = input_loc_len + OBJ_CLASS_NUM; int validCount = 0;
int8_t thres_i8 = qnt_f32_to_affine(unsigmoid(threshold), zp, scale); for (int h = 0; h < grid_h; h++) { for (int w = 0; w < grid_w; w++) { for (int a = 0; a < OBJ_CLASS_NUM; a++) { if(input[(input_loc_len + a)*grid_w * grid_h + h * grid_w + w ] >= thres_i8) { //[1,tensor_len,grid_h,grid_w] float box_conf_f32 = sigmoid(deqnt_affine_to_f32(input[(input_loc_len + a) * grid_w * grid_h + h * grid_w + w ], zp, scale)); float loc[input_loc_len]; for (int i = 0; i < input_loc_len; ++i) { loc[i] = deqnt_affine_to_f32(input[i * grid_w * grid_h + h * grid_w + w], zp, scale); }
for (int i = 0; i < input_loc_len / 16; ++i) { softmax(&loc[i * 16], 16); } float xywh_[4] = {0, 0, 0, 0}; float xywh[4] = {0, 0, 0, 0}; for (int dfl = 0; dfl < 16; ++dfl) { xywh_[0] += loc[dfl] * dfl; xywh_[1] += loc[1 * 16 + dfl] * dfl; xywh_[2] += loc[2 * 16 + dfl] * dfl; xywh_[3] += loc[3 * 16 + dfl] * dfl; } xywh_[0]=(w+0.5)-xywh_[0]; xywh_[1]=(h+0.5)-xywh_[1]; xywh_[2]=(w+0.5)+xywh_[2]; xywh_[3]=(h+0.5)+xywh_[3]; xywh[0]=((xywh_[0]+xywh_[2])/2)*stride; xywh[1]=((xywh_[1]+xywh_[3])/2)*stride; xywh[2]=(xywh_[2]-xywh_[0])*stride; xywh[3]=(xywh_[3]-xywh_[1])*stride; xywh[0]=xywh[0]-xywh[2]/2; xywh[1]=xywh[1]-xywh[3]/2; boxes.push_back(xywh[0]);//x boxes.push_back(xywh[1]);//y boxes.push_back(xywh[2]);//w boxes.push_back(xywh[3]);//h boxes.push_back(float(index + (h * grid_w) + w));//keypoints index boxScores.push_back(box_conf_f32); classId.push_back(a); validCount++; } } } } return validCount;}
static int process_u8(uint8_t *input, int grid_h, int grid_w, int stride, std::vector<float> &boxes, std::vector<float> &boxScores, std::vector<int> &classId, float threshold, int32_t zp, float scale, int index) { int input_loc_len = 64; int tensor_len = input_loc_len + OBJ_CLASS_NUM; int validCount = 0;
uint8_t thres_i8 = qnt_f32_to_affine_u8(unsigmoid(threshold), zp, scale); for (int h = 0; h < grid_h; h++) { for (int w = 0; w < grid_w; w++) { for (int a = 0; a < OBJ_CLASS_NUM; a++) { if(input[(input_loc_len + a)*grid_w * grid_h + h * grid_w + w ] >= thres_i8) { //[1,tensor_len,grid_h,grid_w] float box_conf_f32 = sigmoid(deqnt_affine_u8_to_f32(input[(input_loc_len + a) * grid_w * grid_h + h * grid_w + w ], zp, scale)); float loc[input_loc_len]; for (int i = 0; i < input_loc_len; ++i) { loc[i] = deqnt_affine_u8_to_f32(input[i * grid_w * grid_h + h * grid_w + w], zp, scale); }
for (int i = 0; i < input_loc_len / 16; ++i) { softmax(&loc[i * 16], 16); } float xywh_[4] = {0, 0, 0, 0}; float xywh[4] = {0, 0, 0, 0}; for (int dfl = 0; dfl < 16; ++dfl) { xywh_[0] += loc[dfl] * dfl; xywh_[1] += loc[1 * 16 + dfl] * dfl; xywh_[2] += loc[2 * 16 + dfl] * dfl; xywh_[3] += loc[3 * 16 + dfl] * dfl; } xywh_[0]=(w+0.5)-xywh_[0]; xywh_[1]=(h+0.5)-xywh_[1]; xywh_[2]=(w+0.5)+xywh_[2]; xywh_[3]=(h+0.5)+xywh_[3]; xywh[0]=((xywh_[0]+xywh_[2])/2)*stride; xywh[1]=((xywh_[1]+xywh_[3])/2)*stride; xywh[2]=(xywh_[2]-xywh_[0])*stride; xywh[3]=(xywh_[3]-xywh_[1])*stride; xywh[0]=xywh[0]-xywh[2]/2; xywh[1]=xywh[1]-xywh[3]/2; boxes.push_back(xywh[0]);//x boxes.push_back(xywh[1]);//y boxes.push_back(xywh[2]);//w boxes.push_back(xywh[3]);//h boxes.push_back(float(index + (h * grid_w) + w));//keypoints index boxScores.push_back(box_conf_f32); classId.push_back(a); validCount++; } } } } return validCount;}
static int process_fp32(float *input, int grid_h, int grid_w, int stride, std::vector<float> &boxes, std::vector<float> &boxScores, std::vector<int> &classId, float threshold, int32_t zp, float scale, int index) { int input_loc_len = 64; int tensor_len = input_loc_len + OBJ_CLASS_NUM; int validCount = 0; float thres_fp = unsigmoid(threshold); for (int h = 0; h < grid_h; h++) { for (int w = 0; w < grid_w; w++) { for (int a = 0; a < OBJ_CLASS_NUM; a++) { if(input[(input_loc_len + a)*grid_w * grid_h + h * grid_w + w ] >= thres_fp) { //[1,tensor_len,grid_h,grid_w] float box_conf_f32 = sigmoid(input[(input_loc_len + a) * grid_w * grid_h + h * grid_w + w ]); float loc[input_loc_len]; for (int i = 0; i < input_loc_len; ++i) { loc[i] = input[i * grid_w * grid_h + h * grid_w + w]; }
for (int i = 0; i < input_loc_len / 16; ++i) { softmax(&loc[i * 16], 16); } float xywh_[4] = {0, 0, 0, 0}; float xywh[4] = {0, 0, 0, 0}; for (int dfl = 0; dfl < 16; ++dfl) { xywh_[0] += loc[dfl] * dfl; xywh_[1] += loc[1 * 16 + dfl] * dfl; xywh_[2] += loc[2 * 16 + dfl] * dfl; xywh_[3] += loc[3 * 16 + dfl] * dfl; } xywh_[0]=(w+0.5)-xywh_[0]; xywh_[1]=(h+0.5)-xywh_[1]; xywh_[2]=(w+0.5)+xywh_[2]; xywh_[3]=(h+0.5)+xywh_[3]; xywh[0]=((xywh_[0]+xywh_[2])/2)*stride; xywh[1]=((xywh_[1]+xywh_[3])/2)*stride; xywh[2]=(xywh_[2]-xywh_[0])*stride; xywh[3]=(xywh_[3]-xywh_[1])*stride; xywh[0]=xywh[0]-xywh[2]/2; xywh[1]=xywh[1]-xywh[3]/2; boxes.push_back(xywh[0]);//x boxes.push_back(xywh[1]);//y boxes.push_back(xywh[2]);//w boxes.push_back(xywh[3]);//h boxes.push_back(float(index + (h * grid_w) + w));//keypoints index boxScores.push_back(box_conf_f32); classId.push_back(a); validCount++; } } } } return validCount;}
int post_process(rknn_app_context_t *app_ctx, rknn_output *outputs, letterbox_t *letter_box, float conf_threshold, float nms_threshold, object_detect_result_list *od_results){ std::vector<float> filterBoxes; std::vector<float> objProbs; std::vector<int> classId; int validCount = 0; int stride = 0; int grid_h = 0; int grid_w = 0; int model_in_w = app_ctx->model_width; int model_in_h = app_ctx->model_height; memset(od_results, 0, sizeof(object_detect_result_list)); int index = 0;
// 处理三个输出层 for (int i = 0; i < 3; i++) { grid_h = app_ctx->output_attrs[i].dims[2]; grid_w = app_ctx->output_attrs[i].dims[3]; stride = model_in_h / grid_h; if (app_ctx->is_quant) { validCount += process_i8((int8_t *)outputs[i].buf, grid_h, grid_w, stride, filterBoxes, objProbs, classId, conf_threshold, app_ctx->output_attrs[i].zp, app_ctx->output_attrs[i].scale,index); } else { validCount += process_fp32((float *)outputs[i].buf, grid_h, grid_w, stride, filterBoxes, objProbs, classId, conf_threshold, app_ctx->output_attrs[i].zp, app_ctx->output_attrs[i].scale, index); } index += grid_h * grid_w; }
// no object detect if (validCount <= 0) { return 0; } std::vector<int> indexArray; for (int i = 0; i < validCount; ++i) { indexArray.push_back(i); } quick_sort_indice_inverse(objProbs, 0, validCount - 1, indexArray);
std::set<int> class_set(std::begin(classId), std::end(classId));
for (auto c : class_set) { nms(validCount, filterBoxes, classId, indexArray, c, nms_threshold); }
int last_count = 0; od_results->count = 0;
/* box valid detect target */ for (int i = 0; i < validCount; ++i) { if (indexArray[i] == -1 || last_count >= OBJ_NUMB_MAX_SIZE) { continue; } int n = indexArray[i]; float x1 = filterBoxes[n * 5 + 0] - letter_box->x_pad; float y1 = filterBoxes[n * 5 + 1] - letter_box->y_pad; float w = filterBoxes[n * 5 + 2]; float h = filterBoxes[n * 5 + 3]; // if (n * 5 + 4 >= filterBoxes.size()) { // fprintf(stderr, "filterBoxes access out of bound\n"); // return -1; // } int keypoints_index = (int)filterBoxes[n * 5 + 4];
// if (outputs[3].buf == nullptr) { // fprintf(stderr, "Error: outputs[3] is not available or buffer is NULL\n"); // return -1; // }
for (int j = 0; j < 17; ++j) { // if (outputs[i].buf == nullptr) { // fprintf(stderr, "Error: outputs[%d].buf is NULL\n", i); // return -1; // } if (app_ctx->is_quant) { od_results->results[last_count].keypoints[j][0] = ((float)((rknpu2::float16 *)outputs[3].buf)[j*3*8400+0*8400+keypoints_index] - letter_box->x_pad)/ letter_box->scale; od_results->results[last_count].keypoints[j][1] = ((float)((rknpu2::float16 *)outputs[3].buf)[j*3*8400+1*8400+keypoints_index] - letter_box->y_pad)/ letter_box->scale; od_results->results[last_count].keypoints[j][2] = (float)((rknpu2::float16 *)outputs[3].buf)[j*3*8400+2*8400+keypoints_index]; } else { od_results->results[last_count].keypoints[j][0] = (((float *)outputs[3].buf)[j*3*8400+0*8400+keypoints_index] - letter_box->x_pad)/ letter_box->scale; od_results->results[last_count].keypoints[j][1] = (((float *)outputs[3].buf)[j*3*8400+1*8400+keypoints_index] - letter_box->y_pad)/ letter_box->scale; od_results->results[last_count].keypoints[j][2] = ((float *)outputs[3].buf)[j*3*8400+2*8400+keypoints_index]; } }
int id = classId[n]; float obj_conf = objProbs[i]; od_results->results[last_count].box.left = (int)(clamp(x1, 0, model_in_w) / letter_box->scale); od_results->results[last_count].box.top = (int)(clamp(y1, 0, model_in_h) / letter_box->scale); od_results->results[last_count].box.right = (int)(clamp(x1+w, 0, model_in_w) / letter_box->scale); od_results->results[last_count].box.bottom = (int)(clamp(y1+h, 0, model_in_h) / letter_box->scale); // od_results->results[last_count].box.angle = angle; od_results->results[last_count].prop = obj_conf; od_results->results[last_count].cls_id = id; last_count++; } od_results->count = last_count; return 0;}
int init_post_process() { int ret = 0; ret = loadLabelName(LABEL_NALE_TXT_PATH, labels); if (ret < 0) { printf("Load %s failed!\n", LABEL_NALE_TXT_PATH); return -1; } return 0;}
char *coco_cls_to_name(int cls_id) {
if (cls_id >= OBJ_CLASS_NUM) { return "null"; }
if (labels[cls_id]) { return labels[cls_id]; }
return "null";}
void deinit_post_process() { for (int i = 0; i < OBJ_CLASS_NUM; i++) { if (labels[i] != nullptr) { free(labels[i]); labels[i] = nullptr; } }}4、参考链接:
支持与分享
如果这篇文章对你有帮助,欢迎分享给更多人或打赏支持!
Yolo_Pose姿态模型在arm linux的验证与部署
https://firefly.cuteleaf.cn/posts/obsidian/yolo-pose姿态模型在arm-linux的验证与部署/ 相关文章 智能推荐
1
Yolo模型转换
AI 以下都以yolo的姿态检测模型为例 1、准备需要用的程序 第一个工程:rknn toolkit2, 用于安装模型转换所需环境 ,github地址:https://github.com/airockchip/rknn toolkit2/releases 第二个工程:ultralyt
2
Redis在Linux下安装教程
运维部署 Redis安装 1、首先准备REDIS安装包 这里下载的是 redis 5.0.8.tar.gz 安装包,并将其直接放在了 root 目录下 2、解压安装包 在 /usr/local/ 下创建 redis 文件夹并进入 将 Redis 安装包解压到 /usr/local/redi
3
图像增强库Albumentations使用
AI 参考链接: https://blog.csdn.net/hhhhhhhhhhwwwwwwwwww/article/details/116460996
4
Mxnet-GPU-102版本安装
AI 1、安装10.2版本的CUDA硬件加速环境 本blog的安装教程的跳转连接:https://blog.cherrylord.cn/article/post 29 2、创建conda虚拟环境 要创建的环境的python版本需要3.7.13的版本 3、直接安装mxnet cu102的
5
yolov8蒸馏训练
AI 1、分别训练学生模型和教师模型 这里用的是yolov8x.pt为权重训练教师模型,yolov8s.pt作为学生模型 2、蒸馏训练 参考链接: https://blog.csdn.net/W extend/article/details/140902235?spm=1001.201
随机文章 随机推荐