// Tencent is pleased to support the open source community by making ncnn available.
//
// Copyright (C) 2024 THL A29 Limited, a Tencent company. All rights reserved.
//
// Licensed under the BSD 3-Clause License (the "License"); you may not use this file except
// in compliance with the License. You may obtain a copy of the License at
//
// https://opensource.org/licenses/BSD-3-Clause
//
// Unless required by applicable law or agreed to in writing, software distributed
// under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR
// CONDITIONS OF ANY KIND, either express or implied. See the License for the
// specific language governing permissions and limitations under the License.

// 1. install
//      pip3 install -U ultralytics pnnx ncnn
// 2. export yolov8-seg torchscript
//      yolo export model=yolov8n-seg.pt format=torchscript
// 3. convert torchscript with static shape
//      pnnx yolov8n-seg.torchscript
// 4. modify yolov8n_seg_pnnx.py for dynamic shape inference
//      A. modify reshape to support dynamic image sizes
//      B. permute tensor before concat and adjust concat axis
//      C. drop post-process part
//      before:
//          v_144 = v_143.view(1, 32, 6400)
//          v_150 = v_149.view(1, 32, 1600)
//          v_156 = v_155.view(1, 32, 400)
//          v_157 = torch.cat((v_144, v_150, v_156), dim=2)
//          ...
//          v_191 = v_168.view(1, 144, 6400)
//          v_192 = v_179.view(1, 144, 1600)
//          v_193 = v_190.view(1, 144, 400)
//          v_194 = torch.cat((v_191, v_192, v_193), dim=2)
//          ...
//          v_215 = (v_214, v_138, )
//          return v_215
//      after:
//          v_144 = v_143.view(1, 32, -1).transpose(1, 2)
//          v_150 = v_149.view(1, 32, -1).transpose(1, 2)
//          v_156 = v_155.view(1, 32, -1).transpose(1, 2)
//          v_157 = torch.cat((v_144, v_150, v_156), dim=1)
//          ...
//          v_191 = v_168.view(1, 144, -1).transpose(1, 2)
//          v_192 = v_179.view(1, 144, -1).transpose(1, 2)
//          v_193 = v_190.view(1, 144, -1).transpose(1, 2)
//          v_194 = torch.cat((v_191, v_192, v_193), dim=1)
//          return v_194, v_157, v_138
// 5.
re-export yolov8-seg torchscript // python3 -c 'import yolov8n_seg_pnnx; yolov8n_seg_pnnx.export_torchscript()' // 6. convert new torchscript with dynamic shape // pnnx yolov8n_seg_pnnx.py.pt inputshape=[1,3,640,640] inputshape2=[1,3,320,320] // 7. now you get ncnn model files // mv yolov8n_seg_pnnx.py.ncnn.param yolov8n_seg.ncnn.param // mv yolov8n_seg_pnnx.py.ncnn.bin yolov8n_seg.ncnn.bin // the out blob would be a 2-dim tensor with w=176 h=8400 // // | bbox-reg 16 x 4 | per-class scores(80) | // +-----+-----+-----+-----+----------------------+ // | dx0 | dy0 | dx1 | dy1 |0.1 0.0 0.0 0.5 ......| // all /| | | | | . | // boxes | .. | .. | .. | .. |0.0 0.9 0.0 0.0 ......| // (8400)| | | | | . | // \| | | | | . | // +-----+-----+-----+-----+----------------------+ // // // | mask (32) | // +-----------+ // |0.1........| // all /| | // boxes |0.0........| // (8400)| . | // \| . | // +-----------+ // #include "layer.h" #include "net.h" #if defined(USE_NCNN_SIMPLEOCV) #include "simpleocv.h" #else #include #include #include #endif #include #include #include struct Object { cv::Rect_ rect; int label; float prob; int gindex; cv::Mat mask; }; static inline float intersection_area(const Object& a, const Object& b) { cv::Rect_ inter = a.rect & b.rect; return inter.area(); } static void qsort_descent_inplace(std::vector