forked from OAID/Tengine
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathdetection_postprocess.c
128 lines (107 loc) · 4.44 KB
/
detection_postprocess.c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
/*
* Copyright (c) 2020, OPEN AI LAB
* Author: [email protected]
*/
#include <stdio.h>
#include <assert.h>
#include "sys_port.h"
#include "tengine_ir.h"
#include "tengine_errno.h"
#include "tengine_log.h"
#include "tengine_op.h"
#include "parameter.h"
#include "detection_postprocess_param.h"
/*
 * List the named entries of struct detection_postprocess_param that can be
 * accessed by name.
 * NOTE(review): this macro presumably generates the access_param_entry
 * handler and the parse map that this file later references through
 * GET_PARAM_PARSE_MAP() -- confirm against its definition in parameter.h.
 */
DEFINE_PARM_PARSE_ENTRY(detection_postprocess_param, max_detections, max_classes_per_detection, nms_score_threshold,
nms_iou_threshold, num_classes, scales);
/*
 * Infer the shapes of the four output tensors of a detection-postprocess node.
 *
 * The number of reported boxes is
 *     max_detections * max_classes_per_detection
 * (both read from the node's parameter block), and the outputs are shaped as:
 *     output 0: {1, 4, num_detected_boxes}
 *     output 1: {1, num_detected_boxes}
 *     output 2: {1, num_detected_boxes}
 *     output 3: {1}
 *
 * Only one input layout is accepted:
 *     input 0: dims[0] == 1 and dims[1] == 4
 *     input 1: dims[0] == 1, dims[1] == num_classes + 1,
 *              dims[2] == input 0 dims[2]
 *
 * Returns 0 on success. Returns -1 after printing "Not Support." to stderr
 * when the inputs do not match the layout above; no output shape is modified
 * in that case.
 */
static int infer_shape(struct ir_node* node)
{
    struct ir_graph* ir_graph = node->graph;

    struct ir_tensor* input0 = get_ir_graph_tensor(ir_graph, node->input_tensors[0]);
    struct ir_tensor* input1 = get_ir_graph_tensor(ir_graph, node->input_tensors[1]);

    struct ir_tensor* output0 = get_ir_graph_tensor(ir_graph, node->output_tensors[0]);
    struct ir_tensor* output1 = get_ir_graph_tensor(ir_graph, node->output_tensors[1]);
    struct ir_tensor* output2 = get_ir_graph_tensor(ir_graph, node->output_tensors[2]);
    struct ir_tensor* output3 = get_ir_graph_tensor(ir_graph, node->output_tensors[3]);

    struct detection_postprocess_param* detection_postprocess_param =
        ( struct detection_postprocess_param* )(node->op.param_mem);

    int max_detections = detection_postprocess_param->max_detections;
    int max_classes_per_detection = detection_postprocess_param->max_classes_per_detection;
    int num_classes = detection_postprocess_param->num_classes;
    int num_detected_boxes = max_detections * max_classes_per_detection;

    // Only support: batch_size == 1 && num_coord == 4
    if (input0->dims[0] != 1 || input0->dims[1] != 4 || input1->dims[0] != 1 || input1->dims[2] != input0->dims[2] ||
        input1->dims[1] != num_classes + 1)
    {
        fprintf(stderr, "Not Support.\n");
        return -1;
    }

    /* Each array is sized to exactly the rank handed to set_ir_tensor_shape(). */
    int dim0[3] = {1, 4, num_detected_boxes};
    int dim1[2] = {1, num_detected_boxes};
    int dim2[2] = {1, num_detected_boxes};
    int dim3[1] = {1};

    set_ir_tensor_shape(output0, dim0, 3);
    set_ir_tensor_shape(output1, dim1, 2);
    set_ir_tensor_shape(output2, dim2, 2);
    set_ir_tensor_shape(output3, dim3, 1);

    return 0;
}
/*
 * Allocate the parameter block for a detection-postprocess op and attach it,
 * together with the shape-inference callback, to op.
 *
 * Every parameter field named in this file is given a defined starting value
 * (zero / NULL). infer_shape() reads max_detections,
 * max_classes_per_detection and num_classes from this block, so they must not
 * be left holding whatever the allocator returned.
 *
 * Returns 0 on success. On allocation failure sets the tengine errno to
 * ENOMEM, returns -1 and leaves op untouched.
 */
static int init_op(struct ir_op* op)
{
    struct detection_postprocess_param* param =
        ( struct detection_postprocess_param* )sys_malloc(sizeof(struct detection_postprocess_param));

    if (param == NULL)
    {
        set_tengine_errno(ENOMEM);
        return -1;
    }

    /* Defined defaults; real values are expected to be filled in afterwards. */
    param->max_detections = 0;
    param->max_classes_per_detection = 0;
    param->nms_score_threshold = 0.0f;
    param->nms_iou_threshold = 0.0f;
    param->num_classes = 0;
    /* release_op() frees scales only when it is non-NULL. */
    param->scales = NULL;

    op->param_mem = param;
    op->param_size = sizeof(struct detection_postprocess_param);
    op->same_shape = 0;
    op->infer_shape = infer_shape;

    return 0;
}
/*
 * Free the parameter block attached to op: first its scales buffer, when one
 * is set, then the block itself.
 */
static void release_op(struct ir_op* op)
{
    struct detection_postprocess_param* param = ( struct detection_postprocess_param* )op->param_mem;

    /* scales starts out NULL in init_op(), so it may never have been set. */
    if (param->scales != NULL)
    {
        sys_free(param->scales);
    }

    sys_free(op->param_mem);
}
static int register_detection_postprocess_op(void* arg)
{
struct op_method m;
m.op_version = 1;
m.init_op = init_op;
m.release_op = release_op;
m.access_param_entry = access_param_entry;
return register_op(OP_DETECTION_POSTPROCESS, OP_DETECTION_POSTPROCESS_NAME, &m);
}
/*
 * Free the parameter parse map of detection_postprocess_param, then
 * unregister the detection-postprocess op.
 *
 * arg is unused. Returns whatever unregister_op() returns.
 * NOTE(review): the literal 1 is presumably the op version and should match
 * the op_version used at registration -- confirm against unregister_op().
 */
static int unregister_detection_postprocess_op(void* arg)
{
    sys_free(GET_PARAM_PARSE_MAP(detection_postprocess_param));

    int status = unregister_op(OP_DETECTION_POSTPROCESS, 1);

    return status;
}
/*
 * Hand the register / unregister functions of this op to the framework.
 * NOTE(review): these macros presumably arrange for the functions to be
 * called automatically at start-up and shutdown -- confirm against the
 * AUTO_REGISTER_OP / AUTO_UNREGISTER_OP definitions.
 */
AUTO_REGISTER_OP(register_detection_postprocess_op);
AUTO_UNREGISTER_OP(unregister_detection_postprocess_op);