//主要对图片进行预处理,包括resize和归一化
std::vector<float> Detector::prepareImage(cv::Mat &src_img){
std::vector<float> result(INPUT_W * INPUT_H * 3);
float *data = result.data();
float ratio = float(INPUT_W) / float(src_img.cols) < float(INPUT_H) / float(src_img.rows) ? float(INPUT_W) / float(src_img.cols) : float(INPUT_H) / float(src_img.rows);
cv::Mat flt_img = cv::Mat::zeros(cv::Size(INPUT_W, INPUT_H), CV_8UC3);
cv::Mat rsz_img = cv::Mat::zeros(cv::Size(src_img.cols*ratio, src_img.rows*ratio), CV_8UC3);
cv::resize(src_img, rsz_img, cv::Size(), ratio, ratio);
rsz_img.copyTo(flt_img(cv::Rect(0, 0, rsz_img.cols, rsz_img.rows)));
flt_img.convertTo(flt_img, CV_32FC3);
int channelLength = INPUT_W * INPUT_H;
std::vector<cv::Mat> split_img = {
cv::Mat(INPUT_W, INPUT_H, CV_32FC1, data + channelLength * 2),
cv::Mat(INPUT_W, INPUT_H, CV_32FC1, data + channelLength),
cv::Mat(INPUT_W, INPUT_H, CV_32FC1, data)
};
cv::split(flt_img, split_img);
for (int i = 0; i < 3; i++) {
split_img[i] = (split_img[i] - img_mean[i]) / img_std[i];
}
return result;
}
//加载IR模型,初始化网络
bool Detector::init(string xml_path,double cof_threshold,double nms_area_threshold,int input_w, int input_h, int num_class, int r_rows, int r_cols, std::vector<int> s, std::vector<float> i_mean,std::vector<float> i_std){
_xml_path = xml_path;
_cof_threshold = cof_threshold;
_nms_area_threshold = nms_area_threshold;
INPUT_W = input_w;
INPUT_H = input_h;
NUM_CLASS = num_class;
refer_rows = r_rows;
refer_cols = r_cols;
strides = s;
img_mean = i_mean;
img_std = i_std;
Core ie;
auto cnnNetwork = ie.ReadNetwork(_xml_path);
InputsDataMap inputInfo(cnnNetwork.getInputsInfo());
InputInfo::Ptr& input = inputInfo.begin()->second;
_input_name = inputInfo.begin()->first;
input->setPrecision(Precision::FP32);
input->getInputData()->setLayout(Layout::NCHW);
ICNNNetwork::InputShapes inputShapes = cnnNetwork.getInputShapes();
SizeVector& inSizeVector = inputShapes.begin()->second;
cnnNetwork.reshape(inputShapes);
_outputinfo = OutputsDataMap(cnnNetwork.getOutputsInfo());
for (auto &output : _outputinfo) {
output.second->setPrecision(Precision::FP32);
}
_network = ie.LoadNetwork(cnnNetwork, "CPU");
return true;
}
//模型推理及获取输出结果
vector<Detector::Bbox> Detector::process_frame(Mat& inframe){
cv::Mat showImage = inframe.clone();
std::vector<float> pr_img = prepareImage(inframe);
InferRequest::Ptr infer_request = _network.CreateInferRequestPtr();
Blob::Ptr frameBlob = infer_request->GetBlob(_input_name);
InferenceEngine::LockedMemory<void> blobMapped = InferenceEngine::as<InferenceEngine::MemoryBlob>(frameBlob)->wmap();
float* blob_data = blobMapped.as<float*>();
memcpy(blob_data, pr_img.data(), 3 * INPUT_H * INPUT_W * sizeof(float));
infer_request->Infer();
vector<Rect> origin_rect;
vector<float> origin_rect_cof;
int i=0;
vector<Bbox> bboxes;
for (auto &output : _outputinfo) {
auto output_name = output.first;
Blob::Ptr blob = infer_request->GetBlob(output_name);
LockedMemory<const void> blobMapped = as<MemoryBlob>(blob)->rmap();
float *output_blob = blobMapped.as<float *>();
bboxes = postProcess(showImage,output_blob);
++i;
}
return bboxes;
}
//对模型输出结果进行解码及nms
std::vector<Detector::Bbox> Detector::postProcess(const cv::Mat &src_img,
float *output) {
GenerateReferMatrix();
std::vector<Detector::Bbox> result;
float *out = output;
float ratio = std::max(float(src_img.cols) / float(INPUT_W), float(src_img.rows) / float(INPUT_H));
cv::Mat result_matrix = cv::Mat(refer_rows, NUM_CLASS + 4, CV_32FC1, out);
for (int row_num = 0; row_num < refer_rows; row_num++) {
Detector::Bbox box;
auto *row = result_matrix.ptr<float>(row_num);
auto max_pos = std::max_element(row + 4, row + NUM_CLASS + 4);
box.prob = row[max_pos - row];
if (box.prob < _cof_threshold)
continue;
box.classes = max_pos - row - 4;
auto *anchor = refer_matrix.ptr<float>(row_num);
box.x = (anchor[0] - row[0] * anchor[2] + anchor[0] + row[2] * anchor[2]) / 2 * ratio;
box.y = (anchor[1] - row[1] * anchor[2] + anchor[1] + row[3] * anchor[2]) / 2 * ratio;
box.w = (row[2] + row[0]) * anchor[2] * ratio;
box.h = (row[3] + row[1]) * anchor[2] * ratio;
result.push_back(box);
}
NmsDetect(result);
return result;
}//主要对图片进行预处理,包括resize和归一化
std::vector<float> Detector::prepareImage(cv::Mat &src_img){
std::vector<float> result(INPUT_W * INPUT_H * 3);
float *data = result.data();
float ratio = float(INPUT_W) / float(src_img.cols) < float(INPUT_H) / float(src_img.rows) ? float(INPUT_W) / float(src_img.cols) : float(INPUT_H) / float(src_img.rows);
cv::Mat flt_img = cv::Mat::zeros(cv::Size(INPUT_W, INPUT_H), CV_8UC3);
cv::Mat rsz_img = cv::Mat::zeros(cv::Size(src_img.cols*ratio, src_img.rows*ratio), CV_8UC3);
cv::resize(src_img, rsz_img, cv::Size(), ratio, ratio);
rsz_img.copyTo(flt_img(cv::Rect(0, 0, rsz_img.cols, rsz_img.rows)));
flt_img.convertTo(flt_img, CV_32FC3);
int channelLength = INPUT_W * INPUT_H;
std::vector<cv::Mat> split_img = {
cv::Mat(INPUT_W, INPUT_H, CV_32FC1, data + channelLength * 2),
cv::Mat(INPUT_W, INPUT_H, CV_32FC1, data + channelLength),
cv::Mat(INPUT_W, INPUT_H, CV_32FC1, data)
};
cv::split(flt_img, split_img);
for (int i = 0; i < 3; i++) {
split_img[i] = (split_img[i] - img_mean[i]) / img_std[i];
}
return result;
}
//加载IR模型,初始化网络
bool Detector::init(string xml_path,double cof_threshold,double nms_area_threshold,int input_w, int input_h, int num_class, int r_rows, int r_cols, std::vector<int> s, std::vector<float> i_mean,std::vector<float> i_std){
_xml_path = xml_path;
_cof_threshold = cof_threshold;
_nms_area_threshold = nms_area_threshold;
INPUT_W = input_w;
INPUT_H = input_h;
NUM_CLASS = num_class;
refer_rows = r_rows;
refer_cols = r_cols;
strides = s;
img_mean = i_mean;
img_std = i_std;
Core ie;
auto cnnNetwork = ie.ReadNetwork(_xml_path);
InputsDataMap inputInfo(cnnNetwork.getInputsInfo());
InputInfo::Ptr& input = inputInfo.begin()->second;
_input_name = inputInfo.begin()->first;
input->setPrecision(Precision::FP32);
input->getInputData()->setLayout(Layout::NCHW);
ICNNNetwork::InputShapes inputShapes = cnnNetwork.getInputShapes();
SizeVector& inSizeVector = inputShapes.begin()->second;
cnnNetwork.reshape(inputShapes);
_outputinfo = OutputsDataMap(cnnNetwork.getOutputsInfo());
for (auto &output : _outputinfo) {
output.second->setPrecision(Precision::FP32);
}
_network = ie.LoadNetwork(cnnNetwork, "CPU");
return true;
}
//模型推理及获取输出结果
vector<Detector::Bbox> Detector::process_frame(Mat& inframe){
cv::Mat showImage = inframe.clone();
std::vector<float> pr_img = prepareImage(inframe);
InferRequest::Ptr infer_request = _network.CreateInferRequestPtr();
Blob::Ptr frameBlob = infer_request->GetBlob(_input_name);
InferenceEngine::LockedMemory<void> blobMapped = InferenceEngine::as<InferenceEngine::MemoryBlob>(frameBlob)->wmap();
float* blob_data = blobMapped.as<float*>();
memcpy(blob_data, pr_img.data(), 3 * INPUT_H * INPUT_W * sizeof(float));
infer_request->Infer();
vector<Rect> origin_rect;
vector<float> origin_rect_cof;
int i=0;
vector<Bbox> bboxes;
for (auto &output : _outputinfo) {
auto output_name = output.first;
Blob::Ptr blob = infer_request->GetBlob(output_name);
LockedMemory<const void> blobMapped = as<MemoryBlob>(blob)->rmap();
float *output_blob = blobMapped.as<float *>();
bboxes = postProcess(showImage,output_blob);
++i;
}
return bboxes;
}
//对模型输出结果进行解码及nms
std::vector<Detector::Bbox> Detector::postProcess(const cv::Mat &src_img,
float *output) {
GenerateReferMatrix();
std::vector<Detector::Bbox> result;
float *out = output;
float ratio = std::max(float(src_img.cols) / float(INPUT_W), float(src_img.rows) / float(INPUT_H));
cv::Mat result_matrix = cv::Mat(refer_rows, NUM_CLASS + 4, CV_32FC1, out);
for (int row_num = 0; row_num < refer_rows; row_num++) {
Detector::Bbox box;
auto *row = result_matrix.ptr<float>(row_num);
auto max_pos = std::max_element(row + 4, row + NUM_CLASS + 4);
box.prob = row[max_pos - row];
if (box.prob < _cof_threshold)
continue;
box.classes = max_pos - row - 4;
auto *anchor = refer_matrix.ptr<float>(row_num);
box.x = (anchor[0] - row[0] * anchor[2] + anchor[0] + row[2] * anchor[2]) / 2 * ratio;
box.y = (anchor[1] - row[1] * anchor[2] + anchor[1] + row[3] * anchor[2]) / 2 * ratio;
box.w = (row[2] + row[0]) * anchor[2] * ratio;
box.h = (row[3] + row[1]) * anchor[2] * ratio;
result.push_back(box);
}
NmsDetect(result);
return result;
}