|
- // Tencent is pleased to support the open source community by making ncnn available.
- //
- // Copyright (C) 2017 THL A29 Limited, a Tencent company. All rights reserved.
- //
- // Licensed under the BSD 3-Clause License (the "License"); you may not use this file except
- // in compliance with the License. You may obtain a copy of the License at
- //
- // https://opensource.org/licenses/BSD-3-Clause
- //
- // Unless required by applicable law or agreed to in writing, software distributed
- // under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR
- // CONDITIONS OF ANY KIND, either express or implied. See the License for the
- // specific language governing permissions and limitations under the License.
-
- #include <stdio.h>
- #include <algorithm>
- #include <vector>
- #include <opencv2/core/core.hpp>
- #include <opencv2/highgui/highgui.hpp>
- #include <opencv2/imgproc/imgproc.hpp>
- #include <iostream>
-
- #include "net.h"
-
- struct Object{
- cv::Rect rec;
- int class_id;
- float prob;
- };
-
- const char* class_names[] = {"background",
- "aeroplane", "bicycle", "bird", "boat",
- "bottle", "bus", "car", "cat", "chair",
- "cow", "diningtable", "dog", "horse",
- "motorbike", "person", "pottedplant",
- "sheep", "sofa", "train", "tvmonitor"};
-
- static int detect_mobilenet(cv::Mat& raw_img, float show_threshold)
- {
- ncnn::Net mobilenet;
- /*
- * model is converted from https://github.com/chuanqi305/MobileNet-SSD
- * and can be downloaded from https://drive.google.com/open?id=0ByaKLD9QaPtucWk0Y0dha1VVY0U
- */
- int img_h = raw_img.size().height;
- int img_w = raw_img.size().width;
- mobilenet.load_param("mobilenet_ssd_voc_ncnn.param");
- mobilenet.load_model("mobilenet_ssd_voc_ncnn.bin");
- int input_size = 300;
- ncnn::Mat in = ncnn::Mat::from_pixels_resize(raw_img.data, ncnn::Mat::PIXEL_BGR, raw_img.cols, raw_img.rows, input_size, input_size);
-
- const float mean_vals[3] = {127.5f, 127.5f, 127.5f};
- const float norm_vals[3] = {1.0/127.5,1.0/127.5,1.0/127.5};
- in.substract_mean_normalize(mean_vals, norm_vals);
-
- ncnn::Mat out;
-
- ncnn::Extractor ex = mobilenet.create_extractor();
- ex.set_light_mode(true);
- //ex.set_num_threads(4);
- ex.input("data", in);
- ex.extract("detection_out",out);
-
-
- printf("%d %d %d\n", out.w, out.h, out.c);
- std::vector<Object> objects;
- for (int iw=0;iw<out.h;iw++)
- {
- Object object;
- const float *values = out.row(iw);
- object.class_id = values[0];
- object.prob = values[1];
- object.rec.x = values[2] * img_w;
- object.rec.y = values[3] * img_h;
- object.rec.width = values[4] * img_w - object.rec.x;
- object.rec.height = values[5] * img_h - object.rec.y;
- objects.push_back(object);
- }
-
- for(int i = 0;i<objects.size();++i)
- {
- Object object = objects.at(i);
- if(object.prob > show_threshold)
- {
- cv::rectangle(raw_img, object.rec, cv::Scalar(255, 0, 0));
- std::ostringstream pro_str;
- pro_str<<object.prob;
- std::string label = std::string(class_names[object.class_id]) + ": " + pro_str.str();
- int baseLine = 0;
- cv::Size label_size = cv::getTextSize(label, cv::FONT_HERSHEY_SIMPLEX, 0.5, 1, &baseLine);
- cv::rectangle(raw_img, cv::Rect(cv::Point(object.rec.x, object.rec.y- label_size.height),
- cv::Size(label_size.width, label_size.height + baseLine)),
- cv::Scalar(255, 255, 255), CV_FILLED);
- cv::putText(raw_img, label, cv::Point(object.rec.x, object.rec.y),
- cv::FONT_HERSHEY_SIMPLEX, 0.5, cv::Scalar(0, 0, 0));
- }
- }
- cv::imshow("result",raw_img);
- cv::waitKey();
-
- return 0;
- }
-
- int main(int argc, char** argv)
- {
- const char* imagepath = argv[1];
-
- cv::Mat m = cv::imread(imagepath, CV_LOAD_IMAGE_COLOR);
- if (m.empty())
- {
- fprintf(stderr, "cv::imread %s failed\n", imagepath);
- return -1;
- }
-
- detect_mobilenet(m,0.5);
-
- return 0;
- }
|