Merge CV, ver=5.1; ops/methods from HV, and interface from CV where possible
[goodguy/history.git] / cinelerra-5.1 / plugins / motion / opencvwrapper.C
diff --git a/cinelerra-5.1/plugins/motion/opencvwrapper.C b/cinelerra-5.1/plugins/motion/opencvwrapper.C
new file mode 100644 (file)
index 0000000..7c19be6
--- /dev/null
@@ -0,0 +1,551 @@
+/*
+ * CINELERRA
+ * Copyright (C) 1997-2012 Adam Williams <broadcast at earthling dot net>
+ * 
+ * This program is free software; you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License as published by
+ * the Free Software Foundation; either version 2 of the License, or
+ * (at your option) any later version.
+ * 
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ * 
+ * You should have received a copy of the GNU General Public License
+ * along with this program; if not, write to the Free Software
+ * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
+ * 
+ */
+
+
+
+#include "opencvwrapper.h"
+#include "vframe.h"
+
+#include "opencv2/calib3d/calib3d.hpp"
+#include "opencv2/objdetect/objdetect.hpp"
+#include "opencv2/features2d/features2d.hpp"
+
+
+#include <iostream>
+#include <vector>
+#include <stdio.h>
+#include <stdlib.h>
+
+
+
+
+using namespace std;
+
+
+// define whether to use approximate nearest-neighbor search
+#define USE_FLANN
+
+// Sizes must be quantized a certain amount for OpenCV
+#define QUANTIZE 8
+
+
+
+double
+compareSURFDescriptors( const float* d1, const float* d2, double best, int length )
+{
+    double total_cost = 0;
+    assert( length % 4 == 0 );
+    for( int i = 0; i < length; i += 4 )
+    {
+        double t0 = d1[i  ] - d2[i  ];
+        double t1 = d1[i+1] - d2[i+1];
+        double t2 = d1[i+2] - d2[i+2];
+        double t3 = d1[i+3] - d2[i+3];
+        total_cost += t0*t0 + t1*t1 + t2*t2 + t3*t3;
+        if( total_cost > best )
+            break;
+    }
+    return total_cost;
+}
+
+
+int
+naiveNearestNeighbor( const float* vec, int laplacian,
+                      const CvSeq* model_keypoints,
+                      const CvSeq* model_descriptors )
+{
+    int length = (int)(model_descriptors->elem_size/sizeof(float));
+    int i, neighbor = -1;
+    double d, dist1 = 1e6, dist2 = 1e6;
+    CvSeqReader reader, kreader;
+    cvStartReadSeq( model_keypoints, &kreader, 0 );
+    cvStartReadSeq( model_descriptors, &reader, 0 );
+
+    for( i = 0; i < model_descriptors->total; i++ )
+    {
+        const CvSURFPoint* kp = (const CvSURFPoint*)kreader.ptr;
+        const float* mvec = (const float*)reader.ptr;
+       CV_NEXT_SEQ_ELEM( kreader.seq->elem_size, kreader );
+        CV_NEXT_SEQ_ELEM( reader.seq->elem_size, reader );
+        if( laplacian != kp->laplacian )
+            continue;
+        d = compareSURFDescriptors( vec, mvec, dist2, length );
+        if( d < dist1 )
+        {
+            dist2 = dist1;
+            dist1 = d;
+            neighbor = i;
+        }
+        else if ( d < dist2 )
+            dist2 = d;
+    }
+    if ( dist1 < 0.6*dist2 )
+        return neighbor;
+    return -1;
+}
+
+void
+findPairs( const CvSeq* objectKeypoints, const CvSeq* objectDescriptors,
+           const CvSeq* imageKeypoints, const CvSeq* imageDescriptors, vector<int>& ptpairs )
+{
+    int i;
+    CvSeqReader reader, kreader;
+    cvStartReadSeq( objectKeypoints, &kreader );
+    cvStartReadSeq( objectDescriptors, &reader );
+    ptpairs.clear();
+
+    for( i = 0; i < objectDescriptors->total; i++ )
+    {
+        const CvSURFPoint* kp = (const CvSURFPoint*)kreader.ptr;
+        const float* descriptor = (const float*)reader.ptr;
+        CV_NEXT_SEQ_ELEM( kreader.seq->elem_size, kreader );
+        CV_NEXT_SEQ_ELEM( reader.seq->elem_size, reader );
+        int nearest_neighbor = naiveNearestNeighbor( descriptor, kp->laplacian, imageKeypoints, imageDescriptors );
+        if( nearest_neighbor >= 0 )
+        {
+            ptpairs.push_back(i);
+            ptpairs.push_back(nearest_neighbor);
+        }
+    }
+}
+
+
+void
+flannFindPairs( const CvSeq*, 
+       const CvSeq* objectDescriptors,
+    const CvSeq*, 
+       const CvSeq* imageDescriptors, 
+       vector<int>& ptpairs )
+{
+       int length = (int)(objectDescriptors->elem_size/sizeof(float));
+
+    cv::Mat m_object(objectDescriptors->total, length, CV_32F);
+       cv::Mat m_image(imageDescriptors->total, length, CV_32F);
+
+
+       // copy descriptors
+    CvSeqReader obj_reader;
+       float* obj_ptr = m_object.ptr<float>(0);
+    cvStartReadSeq( objectDescriptors, &obj_reader );
+    for(int i = 0; i < objectDescriptors->total; i++ )
+    {
+        const float* descriptor = (const float*)obj_reader.ptr;
+        CV_NEXT_SEQ_ELEM( obj_reader.seq->elem_size, obj_reader );
+        memcpy(obj_ptr, descriptor, length*sizeof(float));
+        obj_ptr += length;
+    }
+    CvSeqReader img_reader;
+       float* img_ptr = m_image.ptr<float>(0);
+    cvStartReadSeq( imageDescriptors, &img_reader );
+    for(int i = 0; i < imageDescriptors->total; i++ )
+    {
+        const float* descriptor = (const float*)img_reader.ptr;
+        CV_NEXT_SEQ_ELEM( img_reader.seq->elem_size, img_reader );
+        memcpy(img_ptr, descriptor, length*sizeof(float));
+        img_ptr += length;
+    }
+
+    // find nearest neighbors using FLANN
+    cv::Mat m_indices(objectDescriptors->total, 2, CV_32S);
+    cv::Mat m_dists(objectDescriptors->total, 2, CV_32F);
+    cv::flann::Index flann_index(m_image, cv::flann::KDTreeIndexParams(4));  // using 4 randomized kdtrees
+    flann_index.knnSearch(m_object, m_indices, m_dists, 2, cv::flann::SearchParams(64) ); // maximum number of leafs checked
+
+    int* indices_ptr = m_indices.ptr<int>(0);
+    float* dists_ptr = m_dists.ptr<float>(0);
+//printf("flannFindPairs %d m_indices.rows=%d\n", __LINE__, m_indices.rows);
+    for (int i = 0; i < m_indices.rows; ++i) 
+       {
+//printf("flannFindPairs %d dists=%f %f\n", __LINE__, dists_ptr[2 * i], 0.6 * dists_ptr[2 * i + 1]);
+       if (dists_ptr[2 * i] < 0.6 * dists_ptr[2 * i + 1]) 
+               {
+//printf("flannFindPairs %d pairs=%d\n", __LINE__, ptpairs.size());
+               ptpairs.push_back(i);
+               ptpairs.push_back(indices_ptr[2*i]);
+       }
+    }
+}
+
+
+/* a rough implementation for object location */
+int OpenCVWrapper::locatePlanarObject(const CvSeq* objectKeypoints, 
+       const CvSeq* objectDescriptors,
+    const CvSeq* imageKeypoints, 
+       const CvSeq* imageDescriptors,
+    const CvPoint src_corners[4], 
+       int *(*point_pairs),
+       int (*total_pairs))
+{
+    double h[9];
+    CvMat _h = cvMat(3, 3, CV_64F, h);
+    vector<int> ptpairs;
+    vector<CvPoint2D32f> pt1, pt2;
+    CvMat _pt1, _pt2;
+    int i, n;
+       
+       (*point_pairs) = 0;
+       (*total_pairs) = 0;
+
+#ifdef USE_FLANN
+    flannFindPairs( objectKeypoints, objectDescriptors, imageKeypoints, imageDescriptors, ptpairs );
+#else
+    findPairs( objectKeypoints, objectDescriptors, imageKeypoints, imageDescriptors, ptpairs );
+#endif
+
+
+// Store keypoints
+       (*point_pairs) = (int*)calloc(ptpairs.size(), sizeof(int));
+       (*total_pairs) = ptpairs.size() / 2;
+       
+       
+    for(int i = 0; i < (int)ptpairs.size(); i++)
+    {
+               (*point_pairs)[i] = ptpairs[i];
+    }
+
+
+
+    n = (int)(ptpairs.size()/2);
+    if( n < 4 )
+        return 0;
+
+    pt1.resize(n);
+    pt2.resize(n);
+    for( i = 0; i < n; i++ )
+    {
+        pt1[i] = ((CvSURFPoint*)cvGetSeqElem(objectKeypoints,ptpairs[i*2]))->pt;
+        pt2[i] = ((CvSURFPoint*)cvGetSeqElem(imageKeypoints,ptpairs[i*2+1]))->pt;
+    }
+
+    _pt1 = cvMat(1, n, CV_32FC2, &pt1[0] );
+    _pt2 = cvMat(1, n, CV_32FC2, &pt2[0] );
+    if( !cvFindHomography( &_pt1, &_pt2, &_h, CV_RANSAC, 5 ))
+        return 0;
+
+    for( i = 0; i < 4; i++ )
+    {
+        double x = src_corners[i].x, y = src_corners[i].y;
+        double Z = 1./(h[6]*x + h[7]*y + h[8]);
+        double X = (h[0]*x + h[1]*y + h[2])*Z;
+        double Y = (h[3]*x + h[4]*y + h[5])*Z;
+        dst_corners[i * 2] = X;
+               dst_corners[i * 2 + 1] = Y;
+    }
+
+    return 1;
+}
+
+
+
+
+OpenCVWrapper::OpenCVWrapper()
+{
+       object_image = 0;
+       scene_image = 0;
+       object_image_w = 0;
+       object_image_h = 0;
+       scene_image_w = 0;
+       scene_image_h = 0;
+       storage = 0;
+       object_keypoints = 0;
+       object_descriptors = 0;
+       scene_keypoints = 0;
+       scene_descriptors = 0;
+       point_pairs = 0;
+       total_pairs = 0;
+}
+
+
+
+
+
+
+OpenCVWrapper::~OpenCVWrapper()
+{
+// This releases all the arrays
+       if(storage) cvReleaseMemStorage(&storage);
+       if(object_image) cvReleaseImage(&object_image);
+       if(scene_image) cvReleaseImage(&scene_image);
+       if(point_pairs) free(point_pairs);
+}
+
+
+
+
+
+int OpenCVWrapper::scan(VFrame *object_frame,
+       VFrame *scene_frame,
+       int object_x1, 
+       int object_y1,
+       int object_x2,
+       int object_y2,
+       int scene_x1,
+       int scene_y1,
+       int scene_x2,
+       int scene_y2)
+{
+       int result = 0;
+       int object_w = object_x2 - object_x1;
+       int object_h = object_y2 - object_y1;
+       int scene_w = scene_x2 - scene_x1;
+       int scene_h = scene_y2 - scene_y1;
+
+
+//object_frame->write_png("/tmp/object.png");
+//scene_frame->write_png("/tmp/scene.png");
+
+// Get quantized sizes
+       int object_image_w = object_w;
+       int object_image_h = object_h;
+       int scene_image_w = scene_w;
+       int scene_image_h = scene_h;
+       if(object_w % QUANTIZE) object_image_w += QUANTIZE - (object_w % QUANTIZE);
+       if(object_h % QUANTIZE) object_image_h += QUANTIZE - (object_h % QUANTIZE);
+       if(scene_w % QUANTIZE) scene_image_w += QUANTIZE - (scene_w % QUANTIZE);
+       if(scene_h % QUANTIZE) scene_image_h += QUANTIZE - (scene_h % QUANTIZE);
+
+       if(object_image && 
+               (object_image_w != this->object_image_w ||
+               object_image_h != this->object_image_h))
+       {
+               cvReleaseImage(&object_image);
+               object_image = 0;
+       }
+       this->object_image_w = object_image_w;
+       this->object_image_h = object_image_h;
+
+       if(scene_image && 
+               (scene_image_w != this->scene_image_w ||
+               scene_image_h != this->scene_image_h))
+       {
+               cvReleaseImage(&scene_image);
+               scene_image = 0;
+       }
+       this->scene_image_w = scene_image_w;
+       this->scene_image_h = scene_image_h;
+
+
+       if(!object_image)
+       {
+// Only does greyscale
+               object_image = cvCreateImage( 
+                       cvSize(object_image_w, object_image_h), 
+                       8, 
+                       1);
+       }
+
+       if(!scene_image)
+       {
+// Only does greyscale
+               scene_image = cvCreateImage( 
+                       cvSize(scene_image_w, scene_image_h), 
+                       8, 
+                       1);
+       }
+
+// Select only region with image size
+// Does this do anything?
+       cvSetImageROI( object_image, cvRect( 0, 0, object_w, object_h ) );
+       cvSetImageROI( scene_image, cvRect( 0, 0, scene_w, scene_h ) );
+
+       grey_crop((unsigned char*)scene_image->imageData, 
+               scene_frame, 
+               scene_x1, 
+               scene_y1, 
+               scene_x2, 
+               scene_y2,
+               scene_image_w,
+               scene_image_h);
+       grey_crop((unsigned char*)object_image->imageData, 
+               object_frame, 
+               object_x1, 
+               object_y1, 
+               object_x2, 
+               object_y2,
+               object_image_w,
+               object_image_h);
+
+
+       if(!storage) storage = cvCreateMemStorage(0);
+       CvSURFParams params = cvSURFParams(500, 1);
+
+
+//printf("OpenCVWrapper::process_buffer %d\n", __LINE__);
+
+// TODO: make the surf data persistent & check for image changes instead
+       if(object_keypoints) cvClearSeq(object_keypoints);
+       if(object_descriptors) cvClearSeq(object_descriptors);
+       if(scene_keypoints) cvClearSeq(scene_keypoints);
+       if(scene_descriptors) cvClearSeq(scene_descriptors);
+       object_keypoints = 0;
+       object_descriptors = 0;
+       scene_keypoints = 0;
+       scene_descriptors = 0;
+
+// Free the image structures
+       if(point_pairs) free(point_pairs);
+       point_pairs = 0;
+
+
+       cvExtractSURF(object_image, 
+               0, 
+               &object_keypoints, 
+               &object_descriptors, 
+               storage, 
+               params,
+               0);
+
+//printf("OpenCVWrapper::scan %d object keypoints=%d\n", __LINE__, object_keypoints->total);
+// Draw the keypoints
+//             for(int i = 0; i < object_keypoints->total; i++)
+//             {
+//             CvSURFPoint* r1 = (CvSURFPoint*)cvGetSeqElem( object_keypoints, i );
+//                     int size = r1->size / 4;
+//                     draw_rect(frame[object_layer], 
+//                             r1->pt.x + object_x1 - size, 
+//                             r1->pt.y + object_y1 - size, 
+//                             r1->pt.x + object_x1 + size, 
+//                             r1->pt.y + object_y1 + size);
+//             }
+
+
+//printf("OpenCVWrapper::process_buffer %d\n", __LINE__);
+
+       cvExtractSURF(scene_image, 
+               0, 
+               &scene_keypoints, 
+               &scene_descriptors, 
+               storage, 
+               params,
+               0);
+
+// Draw the keypoints
+//             for(int i = 0; i < scene_keypoints->total; i++)
+//             {
+//             CvSURFPoint* r1 = (CvSURFPoint*)cvGetSeqElem( scene_keypoints, i );
+//                     int size = r1->size / 4;
+//                     draw_rect(frame[scene_layer], 
+//                             r1->pt.x + scene_x1 - size, 
+//                             r1->pt.y + scene_y1 - size, 
+//                             r1->pt.x + scene_x1 + size, 
+//                             r1->pt.y + scene_y1 + size);
+//             }
+
+// printf("OpenCVWrapper::scan %d %d %d scene keypoints=%d\n", 
+// __LINE__, 
+// scene_w,
+// scene_h,
+// scene_keypoints->total);
+
+       CvPoint src_corners[4] = 
+       {
+               { 0, 0 }, 
+               { object_w, 0 }, 
+               { object_w, object_h }, 
+               { 0, object_h }
+       };
+
+       for(int i = 0; i < 8; i++)
+       {
+               dst_corners[i] = 0;
+       }
+
+
+
+//printf("OpenCVWrapper::process_buffer %d\n", __LINE__);
+       if(scene_keypoints->total &&
+               object_keypoints->total &&
+               locatePlanarObject(object_keypoints, 
+                       object_descriptors, 
+                       scene_keypoints, 
+                       scene_descriptors, 
+                       src_corners, 
+                       &point_pairs,
+                       &total_pairs))
+       {
+               result = 1;
+       }
+
+
+       return result;
+}
+
+
+
+
+
+
+// Convert to greyscale & crop
+void OpenCVWrapper::grey_crop(unsigned char *dst, 
+       VFrame *src, 
+       int x1, 
+       int y1,
+       int x2,
+       int y2,
+       int dst_w,
+       int dst_h)
+{
+// Dimensions of dst frame
+       int w = x2 - x1;
+       int h = y2 - y1;
+
+       bzero(dst, dst_w * dst_h);
+
+//printf("OpenCVWrapper::grey_crop %d %d %d\n", __LINE__, w, h);
+       for(int i = 0; i < h; i++)
+       {
+               switch(src->get_color_model())
+               {
+                       case BC_RGB888:
+                               break;
+
+                       case BC_YUV888:
+                       {
+                               unsigned char *input = src->get_rows()[i + y1] + x1 * 3;
+                               unsigned char *output = dst + i * dst_w;
+
+                               for(int j = 0; j < w; j++)
+                               {
+// Y channel only
+                                       *output = *input;
+                                       input += 3;
+                                       output++;
+                               }
+                               break;
+                       }
+               }
+       }
+}
+
+
+float OpenCVWrapper::get_dst_x(int number)
+{
+       return dst_corners[number * 2];
+}
+
+float OpenCVWrapper::get_dst_y(int number)
+{
+       return dst_corners[number * 2 + 1];
+}
+
+
+
+
+