diff options
author | Stanislaw Halik <sthalik@misaki.pl> | 2017-04-18 08:04:12 +0200 |
---|---|---|
committer | Stanislaw Halik <sthalik@misaki.pl> | 2017-04-18 08:04:12 +0200 |
commit | 39acca95501fa7b0d77f8e6d2cbf97f45cff4ebf (patch) | |
tree | e9920d53b63a7796e4b8d3f23c7afb377d9e0103 | |
parent | 068064dfe6a51ea86757b4cc664f048fb16486e8 (diff) |
tracker/pt: revert extractor change
-rw-r--r-- | tracker-pt/point_extractor.cpp | 170 | ||||
-rw-r--r-- | tracker-pt/point_extractor.h | 6 |
2 files changed, 113 insertions, 63 deletions
diff --git a/tracker-pt/point_extractor.cpp b/tracker-pt/point_extractor.cpp index 2473ebc3..4bd92d44 100644 --- a/tracker-pt/point_extractor.cpp +++ b/tracker-pt/point_extractor.cpp @@ -37,24 +37,26 @@ corresponding location is a good candidate for the extracted point. The idea similar to the window scaling suggested in Berglund et al. "Fast, bias-free algorithm for tracking single particles with variable size and shape." (2008). */ -static cv::Vec2d MeanShiftIteration(const cv::Mat& frame_gray, const cv::Vec2d& current_center, double filter_width) +static cv::Vec2d MeanShiftIteration(const cv::Mat &frame_gray, const cv::Vec2d ¤t_center, double filter_width) { // Most amazingling this function runs faster with doubles than with floats. const double s = 1.0 / filter_width; double m = 0; cv::Vec2d com(0.0, 0.0); - const int h = frame_gray.rows, w = frame_gray.cols; - for (int i = 0; i < h; i++) + for (int i = 0; i < frame_gray.rows; i++) { - auto frame_ptr = (const unsigned char* OTR_RESTRICT)frame_gray.ptr(i); - for (int j = 0; j < w; j++) + auto frame_ptr = (uint8_t *)frame_gray.ptr(i); + for (int j = 0; j < frame_gray.cols; j++) { double val = frame_ptr[j]; - double dx = (j - current_center[0])*s; - double dy = (i - current_center[1])*s; - double f = std::max(0.0, 1.0 - dx*dx - dy*dy); - val *= f; + val = val * val; // taking the square wights brighter parts of the image stronger. + { + double dx = (j - current_center[0])*s; + double dy = (i - current_center[1])*s; + double f = std::max(0.0, 1.0 - dx*dx - dy*dy); + val *= f; + } m += val; com[0] += j * val; com[1] += i * val; @@ -68,7 +70,6 @@ static cv::Vec2d MeanShiftIteration(const cv::Mat& frame_gray, const cv::Vec2d& else return current_center; } -// End of mean shift code. At this point, blob positions are updated which hopefully less noisy less biased values. PointExtractor::PointExtractor() { @@ -114,7 +115,7 @@ void PointExtractor::extract_points(const cv::Mat& frame, cv::Mat& preview_frame static constexpr double max_radius = 15; const double radius = max(0., (max_radius-min_radius) * s.threshold / 255 + min_radius); - const float* ptr = reinterpret_cast<const float* OTR_RESTRICT>(hist.ptr(0)); + const float* ptr = reinterpret_cast<const float*>(hist.ptr(0)); const unsigned area = unsigned(round(3 * M_PI * radius*radius)); const unsigned sz = unsigned(hist.cols * hist.rows); unsigned thres = 1; @@ -137,11 +138,10 @@ void PointExtractor::extract_points(const cv::Mat& frame, cv::Mat& preview_frame frame_bin.copyTo(frame_blobs); unsigned idx = 0; - const int h = frame_blobs.rows, w = frame_blobs.cols; - for (int y=0; y < h; y++) + for (int y=0; y < frame_blobs.rows; y++) { - const unsigned char* OTR_RESTRICT ptr_bin = frame_blobs.ptr(y); - for (int x=0; x < w; x++) + const unsigned char* ptr_bin = frame_blobs.ptr(y); + for (int x=0; x < frame_blobs.cols; x++) { if (ptr_bin[x] != 255) continue; @@ -153,20 +153,87 @@ void PointExtractor::extract_points(const cv::Mat& frame, cv::Mat& preview_frame cv::Scalar(idx), &rect, cv::Scalar(0), - cv::Scalar(0)); - - const double radius = sqrt(rect.width * rect.height / M_PI); - if (radius > region_size_max || radius < region_size_min) - continue; + cv::Scalar(0), + 8); - blobs.push_back(blob { radius, cv::Vec2d(rect.x/* + rect.width/2.*/, rect.y/* + rect.height/2.*/), rect }); + // these are doubles since m10 and m01 could overflow theoretically + // log2(255^2 * 640^2 * pi) > 36 + double m10 = 0; + double m01 = 0; + // norm can't overflow since there's no 640^2 component + int norm = 0; + int cnt = 0; - if (idx >= max_blobs) goto end; + for (int i=rect.y; i < (rect.y+rect.height); i++) + { + unsigned char* ptr_blobs = frame_blobs.ptr(i); + const unsigned char* ptr_gray = frame_gray.ptr(i); + for (int j=rect.x; j < (rect.x+rect.width); j++) + { + if (ptr_blobs[j] != idx) + continue; + + ptr_blobs[j] = 0; + + // square as a weight gives better results + const int val(int(ptr_gray[j]) * int(ptr_gray[j])); + + norm += val; + m01 += i * val; + m10 += j * val; + cnt++; + } + } + if (norm > 0) + { + const double radius = sqrt(cnt / M_PI), N = double(norm); + if (radius > region_size_max || radius < region_size_min) + continue; + + blob b(radius, cv::Vec2d(m10 / N, m01 / N), N/sqrt(double(cnt)), rect); + blobs.push_back(b); + + { + static const f offx = 10, offy = 7.5; + const f cx = preview_frame.cols / f(frame.cols), + cy = preview_frame.rows / f(frame.rows); + cv::Point p(iround(b.pos[0] * cx), iround(b.pos[1] * cy)); + + static const cv::Scalar color(0, 255, 0); + + cv::circle(preview_frame, p, b.radius, color); + + { + const int len = iround(b.radius * 1.25) + 1; + cv::line(preview_frame, + cv::Point(p.x - len, p.y), + cv::Point(p.x + len, p.y), + color); + cv::line(preview_frame, + cv::Point(p.x, p.y - len), + cv::Point(p.x, p.y + len), + color); + } + + char buf[64]; + sprintf(buf, "%.2fpx", radius); + + cv::putText(preview_frame, + buf, + cv::Point(iround(b.pos[0]*cx+offx), iround(b.pos[1]*cy+offy)), + cv::FONT_HERSHEY_PLAIN, + 1, + cv::Scalar(0, 0, 255), + 1); + } + + if (idx >= max_blobs) goto end; + } } } end: - sort(blobs.begin(), blobs.end(), [](const blob& b1, const blob& b2) { return b2.radius < b1.radius; }); + sort(blobs.begin(), blobs.end(), [](const blob& b1, const blob& b2) -> bool { return b2.brightness < b1.brightness; }); const int W = frame.cols; const int H = frame.rows; @@ -176,59 +243,35 @@ end: blob &b = blobs[idx]; cv::Rect rect = b.rect; + rect.x -= rect.width / 2; + rect.y -= rect.height / 2; + rect.width *= 2; + rect.height *= 2; + rect &= cv::Rect(0, 0, W, H); // crop at frame boundaries + cv::Mat frame_roi = frame_gray(rect); - static constexpr double radius_c = 2; + // smaller values mean more changes. 1 makes too many changes while 1.5 makes about .1 + // seems values close to 1.3 reduce noise best with about .15->.2 changes + static constexpr double radius_c = 1.3; const double kernel_radius = b.radius * radius_c; cv::Vec2d pos(b.pos[0] - rect.x, b.pos[1] - rect.y); // position relative to ROI. - int iter; (void)iter; - for (iter = 0; iter < 10; ++iter) + for (int iter = 0; iter < 10; ++iter) { - cv::Vec2d com_new = MeanShiftIteration(frame_roi, com_new, kernel_radius); + cv::Vec2d com_new = MeanShiftIteration(frame_roi, pos, kernel_radius); cv::Vec2d delta = com_new - pos; pos = com_new; if (delta.dot(delta) < 1e-3) break; } - b.pos = cv::Vec2d(pos[0] + rect.x, pos[1] + rect.y); - - { - static const f offx = 10, offy = 7.5; - const f cx = preview_frame.cols / f(frame.cols), - cy = preview_frame.rows / f(frame.rows), - c = .5*(cx+cy); - cv::Point p(iround(b.pos[0] * cx), iround(b.pos[1] * cy)); - - static const cv::Scalar color(0, 255, 0); - - { - const int len = iround(b.radius * c * 1.1) + 1; - cv::line(preview_frame, - cv::Point(p.x - len, p.y), - cv::Point(p.x + len, p.y), - color); - cv::line(preview_frame, - cv::Point(p.x, p.y - len), - cv::Point(p.x, p.y + len), - color); - } - - char buf[32]; - sprintf(buf, "%.2fpx", b.radius); - - cv::putText(preview_frame, - buf, - cv::Point(iround(b.pos[0]*cx+offx), iround(b.pos[1]*cy+offy)), - cv::FONT_HERSHEY_PLAIN, - 1, - cv::Scalar(0, 0, 255), - 1); - } + b.pos[0] = pos[0] + rect.x; + b.pos[1] = pos[1] + rect.y; } + // End of mean shift code. At this point, blob positions are updated which hopefully less noisy less biased values. points.reserve(max_blobs); points.clear(); @@ -241,3 +284,8 @@ end: } } +PointExtractor::blob::blob(double radius, const cv::Vec2d& pos, double brightness, cv::Rect& rect) : + radius(radius), brightness(brightness), pos(pos), rect(rect) +{ + //qDebug() << "radius" << radius << "pos" << pos[0] << pos[1]; +} diff --git a/tracker-pt/point_extractor.h b/tracker-pt/point_extractor.h index 3c0b76d8..f931edd5 100644 --- a/tracker-pt/point_extractor.h +++ b/tracker-pt/point_extractor.h @@ -38,11 +38,13 @@ private: cv::Mat hist; cv::Mat frame_blobs; - struct blob final + struct blob { - double radius; + double radius, brightness; vec2 pos; cv::Rect rect; + + blob(double radius, const cv::Vec2d& pos, double brightness, cv::Rect &rect); }; std::vector<blob> blobs; |