#include "layer.h" #include "net.h" #if defined(USE_NCNN_SIMPLEOCV) #include "simpleocv.h" #include #else #include #include #include #include #endif #include #include #include #include #include "BYTETracker.h" #define YOLOX_NMS_THRESH 0.7 // nms threshold #define YOLOX_CONF_THRESH 0.1 // threshold of bounding box prob #define INPUT_W 1088 // target image size w after resize #define INPUT_H 608 // target image size h after resize Mat static_resize(Mat& img) { float r = min(INPUT_W / (img.cols*1.0), INPUT_H / (img.rows*1.0)); // r = std::min(r, 1.0f); int unpad_w = r * img.cols; int unpad_h = r * img.rows; Mat re(unpad_h, unpad_w, CV_8UC3); resize(img, re, re.size()); Mat out(INPUT_H, INPUT_W, CV_8UC3, Scalar(114, 114, 114)); re.copyTo(out(Rect(0, 0, re.cols, re.rows))); return out; } // YOLOX use the same focus in yolov5 class YoloV5Focus : public ncnn::Layer { public: YoloV5Focus() { one_blob_only = true; } virtual int forward(const ncnn::Mat& bottom_blob, ncnn::Mat& top_blob, const ncnn::Option& opt) const { int w = bottom_blob.w; int h = bottom_blob.h; int channels = bottom_blob.c; int outw = w / 2; int outh = h / 2; int outc = channels * 4; top_blob.create(outw, outh, outc, 4u, 1, opt.blob_allocator); if (top_blob.empty()) return -100; #pragma omp parallel for num_threads(opt.num_threads) for (int p = 0; p < outc; p++) { const float* ptr = bottom_blob.channel(p % channels).row((p / channels) % 2) + ((p / channels) / 2); float* outptr = top_blob.channel(p); for (int i = 0; i < outh; i++) { for (int j = 0; j < outw; j++) { *outptr = *ptr; outptr += 1; ptr += 2; } ptr += w; } } return 0; } }; DEFINE_LAYER_CREATOR(YoloV5Focus) struct GridAndStride { int grid0; int grid1; int stride; }; static inline float intersection_area(const Object& a, const Object& b) { cv::Rect_ inter = a.rect & b.rect; return inter.area(); } static void qsort_descent_inplace(std::vector& faceobjects, int left, int right) { int i = left; int j = right; float p = faceobjects[(left + right) / 2].prob; while (i <= j) { while (faceobjects[i].prob > p) i++; while (faceobjects[j].prob < p) j--; if (i <= j) { // swap std::swap(faceobjects[i], faceobjects[j]); i++; j--; } } #pragma omp parallel sections { #pragma omp section { if (left < j) qsort_descent_inplace(faceobjects, left, j); } #pragma omp section { if (i < right) qsort_descent_inplace(faceobjects, i, right); } } } static void qsort_descent_inplace(std::vector& objects) { if (objects.empty()) return; qsort_descent_inplace(objects, 0, objects.size() - 1); } static void nms_sorted_bboxes(const std::vector& faceobjects, std::vector& picked, float nms_threshold) { picked.clear(); const int n = faceobjects.size(); std::vector areas(n); for (int i = 0; i < n; i++) { areas[i] = faceobjects[i].rect.area(); } for (int i = 0; i < n; i++) { const Object& a = faceobjects[i]; int keep = 1; for (int j = 0; j < (int)picked.size(); j++) { const Object& b = faceobjects[picked[j]]; // intersection over union float inter_area = intersection_area(a, b); float union_area = areas[i] + areas[picked[j]] - inter_area; // float IoU = inter_area / union_area if (inter_area / union_area > nms_threshold) keep = 0; } if (keep) picked.push_back(i); } } static void generate_grids_and_stride(const int target_w, const int target_h, std::vector& strides, std::vector& grid_strides) { for (int i = 0; i < (int)strides.size(); i++) { int stride = strides[i]; int num_grid_w = target_w / stride; int num_grid_h = target_h / stride; for (int g1 = 0; g1 < num_grid_h; g1++) { for (int g0 = 0; g0 < num_grid_w; 
static void generate_yolox_proposals(std::vector<GridAndStride> grid_strides, const ncnn::Mat& feat_blob, float prob_threshold, std::vector<Object>& objects)
{
    const int num_grid = feat_blob.h;
    const int num_class = feat_blob.w - 5;
    const int num_anchors = grid_strides.size();

    const float* feat_ptr = feat_blob.channel(0);
    for (int anchor_idx = 0; anchor_idx < num_anchors; anchor_idx++)
    {
        const int grid0 = grid_strides[anchor_idx].grid0;
        const int grid1 = grid_strides[anchor_idx].grid1;
        const int stride = grid_strides[anchor_idx].stride;

        // yolox/models/yolo_head.py decode logic
        // outputs[..., :2] = (outputs[..., :2] + grids) * strides
        // outputs[..., 2:4] = torch.exp(outputs[..., 2:4]) * strides
        float x_center = (feat_ptr[0] + grid0) * stride;
        float y_center = (feat_ptr[1] + grid1) * stride;
        float w = exp(feat_ptr[2]) * stride;
        float h = exp(feat_ptr[3]) * stride;
        float x0 = x_center - w * 0.5f;
        float y0 = y_center - h * 0.5f;

        float box_objectness = feat_ptr[4];
        for (int class_idx = 0; class_idx < num_class; class_idx++)
        {
            float box_cls_score = feat_ptr[5 + class_idx];
            float box_prob = box_objectness * box_cls_score;
            if (box_prob > prob_threshold)
            {
                Object obj;
                obj.rect.x = x0;
                obj.rect.y = y0;
                obj.rect.width = w;
                obj.rect.height = h;
                obj.label = class_idx;
                obj.prob = box_prob;

                objects.push_back(obj);
            }
        } // class loop

        feat_ptr += feat_blob.w;
    } // point anchor loop
}

static int detect_yolox(ncnn::Mat& in_pad, std::vector<Object>& objects, ncnn::Extractor ex, float scale)
{
    ex.input("images", in_pad);

    std::vector<Object> proposals;

    {
        ncnn::Mat out;
        ex.extract("output", out);

        static const int stride_arr[] = {8, 16, 32}; // might have stride=64 in YOLOX
        std::vector<int> strides(stride_arr, stride_arr + sizeof(stride_arr) / sizeof(stride_arr[0]));
        std::vector<GridAndStride> grid_strides;
        generate_grids_and_stride(INPUT_W, INPUT_H, strides, grid_strides);
        generate_yolox_proposals(grid_strides, out, YOLOX_CONF_THRESH, proposals);
    }

    // sort all proposals by score from highest to lowest
    qsort_descent_inplace(proposals);

    // apply nms with nms_threshold
    std::vector<int> picked;
    nms_sorted_bboxes(proposals, picked, YOLOX_NMS_THRESH);

    int count = picked.size();

    objects.resize(count);
    for (int i = 0; i < count; i++)
    {
        objects[i] = proposals[picked[i]];

        // adjust offset to original unpadded
        float x0 = (objects[i].rect.x) / scale;
        float y0 = (objects[i].rect.y) / scale;
        float x1 = (objects[i].rect.x + objects[i].rect.width) / scale;
        float y1 = (objects[i].rect.y + objects[i].rect.height) / scale;

        // clip
        // x0 = std::max(std::min(x0, (float)(img_w - 1)), 0.f);
        // y0 = std::max(std::min(y0, (float)(img_h - 1)), 0.f);
        // x1 = std::max(std::min(x1, (float)(img_w - 1)), 0.f);
        // y1 = std::max(std::min(y1, (float)(img_h - 1)), 0.f);

        objects[i].rect.x = x0;
        objects[i].rect.y = y0;
        objects[i].rect.width = x1 - x0;
        objects[i].rect.height = y1 - y0;
    }

    return 0;
}
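// Scale bookkeeping (illustrative numbers, assuming a 1920x1080 source video):
// static_resize() shrinks the frame by scale = min(1088/1920, 608/1080) ~= 0.563,
// giving a 1080x608 image that is padded to 1088x608 with gray (114, 114, 114).
// detect_yolox() divides the box coordinates by the same scale, so the Objects
// handed to BYTETracker::update() are already in original-frame pixels.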
int main(int argc, char** argv)
{
    if (argc != 2)
    {
        fprintf(stderr, "Usage: %s [videopath]\n", argv[0]);
        return -1;
    }

    ncnn::Net yolox;

    //yolox.opt.use_vulkan_compute = true;
    //yolox.opt.use_bf16_storage = true;
    yolox.opt.num_threads = 20;
    //ncnn::set_cpu_powersave(0);
    //ncnn::set_omp_dynamic(0);
    //ncnn::set_omp_num_threads(20);

    // Focus in yolov5
    yolox.register_custom_layer("YoloV5Focus", YoloV5Focus_layer_creator);

    yolox.load_param("bytetrack_s_op.param");
    yolox.load_model("bytetrack_s_op.bin");

    ncnn::Extractor ex = yolox.create_extractor();

    const char* videopath = argv[1];

    VideoCapture cap(videopath);
    if (!cap.isOpened())
        return 0;

    int img_w = cap.get(CV_CAP_PROP_FRAME_WIDTH);
    int img_h = cap.get(CV_CAP_PROP_FRAME_HEIGHT);
    int fps = cap.get(CV_CAP_PROP_FPS);
    long nFrame = static_cast<long>(cap.get(CV_CAP_PROP_FRAME_COUNT));
    cout << "Total frames: " << nFrame << endl;

    VideoWriter writer("demo.mp4", CV_FOURCC('m', 'p', '4', 'v'), fps, Size(img_w, img_h));

    Mat img;
    BYTETracker tracker(fps, 30);
    int num_frames = 0;
    int total_ms = 1; // accumulated detection + tracking time, in microseconds
    for (;;)
    {
        if (!cap.read(img))
            break;

        num_frames++;
        if (num_frames % 20 == 0)
        {
            cout << "Processing frame " << num_frames << " (" << num_frames * 1000000 / total_ms << " fps)" << endl;
        }
        if (img.empty())
            break;

        float scale = min(INPUT_W / (img.cols * 1.0), INPUT_H / (img.rows * 1.0));
        Mat pr_img = static_resize(img);
        ncnn::Mat in_pad = ncnn::Mat::from_pixels_resize(pr_img.data, ncnn::Mat::PIXEL_BGR2RGB, INPUT_W, INPUT_H, INPUT_W, INPUT_H);

        // python 0-1 input tensor with rgb_means = (0.485, 0.456, 0.406), std = (0.229, 0.224, 0.225)
        // so for 0-255 input image, rgb_mean should multiply 255 and norm should div by std.
        const float mean_vals[3] = {255.f * 0.485f, 255.f * 0.456f, 255.f * 0.406f};
        const float norm_vals[3] = {1 / (255.f * 0.229f), 1 / (255.f * 0.224f), 1 / (255.f * 0.225f)};

        in_pad.substract_mean_normalize(mean_vals, norm_vals);

        std::vector<Object> objects;
        auto start = chrono::system_clock::now();
        //detect_yolox(img, objects);
        detect_yolox(in_pad, objects, ex, scale);
        vector<STrack> output_stracks = tracker.update(objects);
        auto end = chrono::system_clock::now();
        total_ms = total_ms + chrono::duration_cast<chrono::microseconds>(end - start).count();

        for (int i = 0; i < output_stracks.size(); i++)
        {
            vector<float> tlwh = output_stracks[i].tlwh;
            bool vertical = tlwh[2] / tlwh[3] > 1.6;
            if (tlwh[2] * tlwh[3] > 20 && !vertical)
            {
                Scalar s = tracker.get_color(output_stracks[i].track_id);
                putText(img, format("%d", output_stracks[i].track_id), Point(tlwh[0], tlwh[1] - 5),
                        0, 0.6, Scalar(0, 0, 255), 2, LINE_AA);
                rectangle(img, Rect(tlwh[0], tlwh[1], tlwh[2], tlwh[3]), s, 2);
            }
        }
        putText(img, format("frame: %d fps: %d num: %d", num_frames, num_frames * 1000000 / total_ms, (int)output_stracks.size()),
                Point(0, 30), 0, 0.6, Scalar(0, 0, 255), 2, LINE_AA);
        writer.write(img);

        char c = waitKey(1);
        if (c > 0)
        {
            break;
        }
    }
    cap.release();

    cout << "FPS: " << num_frames * 1000000 / total_ms << endl;

    return 0;
}
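// Example run (a sketch: the binary name and the video file are placeholders,
// and the exact build depends on how ncnn, OpenCV and the ByteTrack sources
// are set up on your machine):
//
//   ./bytetrack video.mp4
//
// The program expects bytetrack_s_op.param and bytetrack_s_op.bin in the
// working directory and writes the annotated result to demo.mp4.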