Avoid obtaining several identical dimensions between two LSH sub-vectors by choosing...
author Pierre-Emmanuel Viel <p.emmanuel.viel@gmail.com>
Thu, 26 Dec 2013 18:44:23 +0000 (19:44 +0100)
committer Pierre-Emmanuel Viel <p.emmanuel.viel@gmail.com>
Thu, 26 Dec 2013 18:44:23 +0000 (19:44 +0100)
modules/flann/include/opencv2/flann/lsh_table.h

index b0f3223..6b8d614 100644 (file)
@@ -348,13 +348,21 @@ inline LshTable<unsigned char>::LshTable(unsigned int feature_size, unsigned int
     mask_ = std::vector<size_t>((size_t)ceil((float)(feature_size * sizeof(char)) / (float)sizeof(size_t)), 0);
 
     // A bit brutal but fast to code
-    std::vector<size_t> indices(feature_size * CHAR_BIT);
-    for (size_t i = 0; i < feature_size * CHAR_BIT; ++i) indices[i] = i;
-    std::random_shuffle(indices.begin(), indices.end());
+    static std::vector<size_t> indices(feature_size * CHAR_BIT);
+
+    //Ensure the Nth bit will be selected only once among the different LshTables
+    //to avoid having two different tables with signatures sharing many dimensions/many bits
+    if( (indices.size() == feature_size * CHAR_BIT) || (indices.size() < key_size_) )
+    {
+      indices.resize( feature_size * CHAR_BIT );
+      for (size_t i = 0; i < feature_size * CHAR_BIT; ++i) indices[i] = i;
+      std::random_shuffle(indices.begin(), indices.end());
+    }
 
     // Generate a random set of order of subsignature_size_ bits
     for (unsigned int i = 0; i < key_size_; ++i) {
-        size_t index = indices[i];
+        size_t index = indices[0];
+        indices.erase( indices.begin() );
 
         // Set that bit in the mask
         size_t divisor = CHAR_BIT * sizeof(size_t);