~medici/adaboost/_boot_strap_procedure_8h_source.html

 /* XBoost: Ada-Boost and Friends on Haar/ICF/HOG Features, Library and ToolBox

  *

  * Copyright (c) 2008-2014 Paolo Medici <medici@ce.unipr.it>

  *

  * This library is free software; you can redistribute it and/or

  * modify it under the terms of the GNU Lesser General Public

  * License as published by the Free Software Foundation; either

  * version 2 of the License, or (at your option) any later version.

  *

  * This library is distributed in the hope that it will be useful,

  * but WITHOUT ANY WARRANTY; without even the implied warranty of

  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU

  * Lesser General Public License for more details.

  *

  * You should have received a copy of the GNU Lesser General Public

  * License along with this library; if not, write to the

  * Free Software Foundation, Inc., 59 Temple Place - Suite 330,

  * Boston, MA 02111-1307, USA.

  */


 #ifndef _BOOTSTRAP_PROCEDURE_H

 #define _BOOTSTRAP_PROCEDURE_H


 #include "NonMaximaSuppression.h"

 #include "Candidate.h"

 #include "IO/datasetin.h"

 #include "Utility/ResponseUtils.h"


 #ifdef _MULTITHREAD

 # include "Thread/thread.h"

 # include "Thread/thread_group.h"

 # include "Thread/bind.h"

 # include "Thread/ref.h"

 #endif  // #ifdef _MULTITHREAD


 /// Parameters for BootStrapProcedure.
 struct BootStrapParams {
     /// scale factor between two images
     float scale_factor;
     /// max number of negatives extracted per frame or per scale
     int negative_random_samples;
     /// non maxima suppression step
     int nms_step;
     /// downsampling factor for computing response
     int downsampling;
     /// threshold
     double thMin;

     /// Set every parameter to its neutral default (unit factors/steps, zero threshold).
     BootStrapParams()
     {
         scale_factor = 1.0f;
         negative_random_samples = 1;
         nms_step = 1;
         downsampling = 1;
         thMin = 0.0;
     }
 };


 // a counter, used for debug; defined in another translation unit
 extern int frameidx;


 template<class SourceDatasetType, class ClassifierType>

 bool BootStrapProcedure( SourceDatasetType & training_set,  datasetin & in, const ClassifierType& cl, const BootStrapParams & params, int num_thread)

 {

     int new_pattern = 0;

     datasetitem item;

     Timer t_elab;

     size sz;

     sz.width = training_set.width;

     sz.height = training_set.height;


     while(in.next(item))

     {

         Image img;


 #ifdef LIMIT_PER_FRAME

         // store

         std::vector< ImageHandle > image_scales;

         std::vector< Candidate > candidates;

 #endif


         // processo per il bootstrap solo le immagini con auto_negative

         if(item.auto_negative && pnm_load(item.filename.c_str(), img))

         {


             int src_width = img.width;

             int src_height = img.height;

             std::cout << "Testing classifier on " << item.filename << " (" << src_width << 'x' << src_height << ") with step " << params.downsampling << " [ID:" << frameidx << "]" << std::endl;

             std::vector<datasetobject> list = item.object;

             float scale = 1.0f;

             ImageResampler rsmp;

             bool first_scale = true;

             int n_negatives = 0;

             Timer t0;


             t0.Start();


             // iterate for all the octaves (it is a slightly different code compared to the one in ObjectDetector)

             for(;;) {

                 // the response is smaller than img because the window outside image are not considered

                 int w_r = ((int) img.width  - (int) sz.width)/params.downsampling;

                 int h_r = ((int) img.height - (int) sz.height)/params.downsampling;


                 std::cout << "\t" << img.width << 'x' << img.height << " (" << w_r << 'x' << h_r << ")... ";

                 std::cout.flush();


                 std::vector<Candidate>   elements;

                 elements.reserve(params.negative_random_samples);

                 typename SourceDatasetType::ReturnType Out;


                 // terminate check (if 3x3 image is provided)

                 if(h_r < 3 || w_r < 3)

                 {

                     std::cout << "\tWarn: response image too small\n";

                     break;

                 }


                 double* response = new double[w_r*h_r];


                 Timer t;


                 t.Start();


                 // precompute the preprocess image

                 training_set.Process(Out, img.data, img.width, img.height, img.stride);


                 // create the optimized version for the classifier:


                 typename ClassifierType::OptimizedType _Inst(cl, 0, Out.second);


                 double r_max,r_min;


 #ifdef _MULTITHREAD

                 if(num_thread > 1)

                 {

                     sprint::thread_group thread_pool_;

                     for(int ii=0; ii<num_thread; ii++)

                     {

                         int startH = (ii*h_r)/num_thread;

                         int endH =   ((ii+1)*h_r)/num_thread;


                         // about 20% increase in performances

                         // thread_pool_.create_thread(sprint::thread_bind(&workerResponse<typename SourceDatasetType::ReturnType,ClassifierType>,response,startH,endH,w_r, &cl, &Out ));

                         thread_pool_.create_thread(sprint::thread_bind(&optimizedWorkerResponse<typename SourceDatasetType::ReturnType, typename ClassifierType::OptimizedType>,response,startH,endH,w_r, sprint::c_ref(_Inst), sprint::c_ref(Out), params.downsampling ));

                     }


                     thread_pool_.join_all();

                 }

                 else

 #endif

                 {

                     // generate the response image

                     // about 20% increase in performances

                     // workerResponse(response, 0, h_r, w_r, &cl, &Out);

                     optimizedWorkerResponse(response, 0, h_r, w_r, _Inst, Out, params.downsampling);

                 }


                 double dt = t.GetTime();


                 r_min = *std::min_element(response,response+w_r*h_r);//dbg

                 r_max = *std::max_element(response,response+w_r*h_r);//dbg


                 std::cout << "\tr_max " << r_max << " | r_min " << r_min;

                 std::cout.flush();

                 // print RESPONSE to debug

                 /* {

                 Image test;

                 test.alloc(w_r, h_r, 3);

                 for(int j =0;j<h_r;++j)

                 for(int i =0;i<w_r;++i)

                 {

                   double r = response[i + j * w_r];

                   if(r>0.0)

                   {

                   unsigned char p = r * 255.0 / r_max;


                   test.data[3*i + test.stride *j+0] = 0;

                   test.data[3*i + test.stride *j+1] = p;

                   test.data[3*i + test.stride *j+2] = 0;

                   }

                   else

                   {

                   unsigned char p = -r * 255.0 / r_min;


                   test.data[3*i + test.stride *j+0] = 0;

                   test.data[3*i + test.stride *j+1] = 0;

                   test.data[3*i + test.stride *j+2] = p;

                   }

                 }

                 static int count = 0;

                 char buffer[256];

                 sprintf(buffer, "/tmp/r%06u.ppm", count);

                     count++;

                     pnm_write(test, buffer);

                 } */


                 std::vector<Candidate> tmpOut;


                 detail::CandidateParam param;


                 param.cl_geom.width = training_set.width;

                 param.cl_geom.height = training_set.height;

                 param.scale = 1.0; // image is extracted by downsampled directly and not from original size image

                 param.step = params.downsampling; // downsampling factor of response image

                 param.category = 0; // unused


                 // search non overlapping box TODO: this could be a parameter

                 int step = params.nms_step / params.downsampling;

                 NonMaximaSuppression(response, tmpOut, step, w_r, w_r, h_r, params.thMin, param, num_thread);


                 std::cout << " | detected: "<< tmpOut.size() << " in " << dt << "s";

                 std::cout.flush();


                 // TODO: check existance of NEGATIVE AREAs

                 /*  {

                   static int count = 0;

                   char buffer[256];

                   Image out;

                   out.clone(img);

                     for(int i=0; i<tmpOut.size(); i++)

                       DrawRect(out, rect( tmpOut[i].roi.x0, tmpOut[i].roi.y0, tmpOut[i].roi.x1-1, tmpOut[i].roi.y1-1), 255);

                   sprintf(buffer, "/tmp/test%06u.pgm", count);

                   count++;

                   pnm_write(out, buffer);

                   }  */


                 for(std::vector<Candidate>::const_iterator i = tmpOut.begin(); i != tmpOut.end(); ++i)

                 {

                     bool is_overlap = false;

                     // puo' solo overlappare dei negativi (non dovrebbero essercene comunque)

                     for(std::vector<datasetobject>::const_iterator j = list.begin(); j != list.end(); ++j)

                     {

                         if(j->category >= 0 && overlap(i->box, j->roi))

                         {

                             is_overlap = true;

                             break;

                         }

                     }


                     if(!is_overlap)

                     {

                         elements.push_back(*i);


                     }

                 }


                 // this code extract at least params.negative_random_samples elements per each scale

 #ifndef LIMIT_PER_FRAME

                 std::cout << " | " << elements.size() << "/" << params.negative_random_samples <<" false positives found" << std::endl;


                 // SORT (TODO or random sampling?)

                 if((int) elements.size() > params.negative_random_samples)

                 {

                     std::sort(elements.begin(), elements.end()); // sort from higher to lower

                     elements.resize(params.negative_random_samples); // erase

                 }


                 for(std::vector<Candidate>::const_iterator i = elements.begin(); i != elements.end(); ++i)

                 {

                     training_set.ImportImage(img.crop(i->box),-1);

                     n_negatives++;

                 }


                 new_pattern += elements.size();

 #else


                 // this code extract at least params.negative_random_samples elements per each frame

                 std::cout << " | " << elements.size() << " false positives found" << std::endl;


                 // crop all elements in candidates and store response and image, for further processing

                 for(std::vector<Candidate>::const_iterator i = elements.begin(); i != elements.end(); ++i)

                 {

                     std::pair<float, Image *> d;

                     d.first = i->response;

                     d.second = new Image;

                     d.second->clone( img.crop(i->roi) );

                     candidates.push_back(d);

                 }


 #endif


                 delete [] response;

                 Out.first.release(); // manually release preprocessed data


                 scale *= params.scale_factor;


                 // size of the response image for the next scale:

                 w_r = (int(src_width/scale)  - (int) sz.width) /params.downsampling;

                 h_r = (int(src_height/scale) - (int) sz.height)/params.downsampling;


                 // it is possible to search for additional scale?

                 // at least 4x4 response image need to be computed to make any sense

                 if(w_r > 3 && h_r > 3)

                 {


                     if(first_scale)

                     {

                         rsmp.ImportImage(img);

                         first_scale = false;

                     }


                     Image out;

                     out.alloc( (int) ((float)src_width/scale), (int) ((float)src_height/scale), 1);

                     rsmp.ExportImage(out);


                     for(unsigned int i=0; i<list.size(); ++i)

                     {   list[i].roi.x0 = floor((float)item.object[i].roi.x0 / scale);

                         list[i].roi.y0 = floor((float)item.object[i].roi.y0 / scale);

                         list[i].roi.x1 = ceil((float)item.object[i].roi.x1 / scale);

                         list[i].roi.y1 = ceil((float)item.object[i].roi.y1 / scale);

                     }


                     std::swap(img, out);


                     /* {

                     static int count = 0;

                     char buffer[256];

                     sprintf(buffer, "/tmp/downsample%06u.pgm", count);

                     count++;

                     pnm_write(img, buffer);

                     } */


                 }

                 else

                     break;

             }


 #ifdef LIMIT_PER_FRAME

             std::cout << "\t" << candidates.size() << "/" << params.negative_random_samples <<" total false positives found" << std::endl;


             // TODO: GroupRectangle?


             if(candidates.size() > params.negative_random_samples)

             {

                 std::sort(candidates.begin(), candidates.end());

             }


             int n = 0;

             for(std::vector<std::pair<float, Image *> >::const_iterator i = candidates.begin(); i != candidates.end(); ++i)

             {

                 if(n<params.negative_random_samples)

                     training_set.ImportImage(*i->second,-1);


                 delete i->second; // release pointer and associated memory

                 ++n;

             }


             new_pattern += candidates.size();

 #else

             std::cout << "\tFrame processed in " << t0.GetTime() << "s. " << n_negatives << " total new negatives imported.\n";

 #endif


             frameidx++;

         }

     }


     std::cout << "Bootstrap completed. " << new_pattern << " added to the negative pool.\n";


     return new_pattern == 0;

 }


 #endif

Image::clone
void clone(const ImageHandle &src)
clone an image
Definition: Image.h:104

frameidx
int frameidx
a counter, used for debug

Timer
Definition: timer.h:84

pnm_load
bool pnm_load(const char *file, Image &out)

BootStrapProcedure
bool BootStrapProcedure(SourceDatasetType &training_set, datasetin &in, const ClassifierType &cl, const BootStrapParams &params, int num_thread)
Definition: BootStrapProcedure.h:69

detail::CandidateParam::cl_geom
size cl_geom
classifier geometry
Definition: Candidate.h:39

BootStrapParams::downsampling
int downsampling
downsampling factor for computing response
Definition: BootStrapProcedure.h:50

detail::CandidateParam
parameters used in the NMS step
Definition: Candidate.h:33

datasetin
a pure virtual pattern list reader
Definition: datasetin.h:56

Image
a structure to hold image data (memory)
Definition: Image.h:74

NonMaximaSuppression.h
Implement a local maxima search algorithm.

ImageHandle::crop
ImageHandle crop(int x0, int y0, int x1, int y1) const
return a subpart of the image (without copy)
Definition: Image.h:47

optimizedWorkerResponse
void optimizedWorkerResponse(double *r, int startH, int endH, int W, const ClassifierType &cl, const ReturnType &out, int step)
Definition: ResponseUtils.h:59

ref.h
reference ref class

detail::CandidateParam::step
int step
response step. Multiplication factor to convert from (x,y) to box coordinates
Definition: Candidate.h:37

ClassifierType
ClassifierType
Definition: Types.h:31

BootStrapParams::negative_random_samples
int negative_random_samples
max number of negatives extracted per frame or per scale
Definition: BootStrapProcedure.h:46

detail::CandidateParam::category
int category
category
Definition: Candidate.h:41

BootStrapParams::scale_factor
float scale_factor
scale factor between two images
Definition: BootStrapProcedure.h:44

BootStrapParams
Parameters for BootStrapProcedure.
Definition: BootStrapProcedure.h:42

BootStrapParams::thMin
double thMin
threshold
Definition: BootStrapProcedure.h:52

sprint::thread_group
Definition: thread_group.h:82

size
image/size TODO namespace
Definition: Types.h:39

thread.h
abstracting thread

sprint::thread_group::join_all
void join_all()
wait all threads terminate
Definition: thread_group.h:114

thread_group.h
proposal 1 for thread group

ResponseUtils.h
helper methods used during response computations

ImageHandle::stride
long stride
line stride, the delta offset, in bytes, between two different scanline
Definition: Image.h:41

BootStrapParams::nms_step
int nms_step
non maxima suppression step
Definition: BootStrapProcedure.h:48

bind.h
method to create function pointer for thread call

sprint::thread_group::create_thread
bool create_thread(const sprint::thread_function &p)
create an additional thread
Definition: thread_group.h:102

datasetitem
an item used for positive
Definition: datasetin.h:44

ImageHandle::width
unsigned int width
image geometry
Definition: Image.h:39

datasetitem::object
std::vector< datasetobject > object
List of object.
Definition: datasetin.h:52

overlap
bool overlap(const rect &a, const rect &b)
test if 2 rect are overlapped

datasetin.h
virtual class to import images

datasetitem::filename
std::string filename
filename
Definition: datasetin.h:46

ImageResampler
Definition: ImageUtils.h:35

Candidate.h
Candidate object.

ImageHandle::data
unsigned char * data
initial address of the first pixel. It must be cast to correct format (uint8, uint16, rgb, etc etc)
Definition: Image.h:43

NonMaximaSuppression
void NonMaximaSuppression(const D *src, FeatureListType &maxima, unsigned int n, long stride, unsigned int width, unsigned int height, D threshold, Param param, int nThreads=sprint::thread::hardware_concurrency())
Definition: NonMaximaSuppression.h:167

datasetitem::auto_negative
bool auto_negative
if the rest of the blob can be used as source for negative
Definition: datasetin.h:50

Image::alloc
void alloc(unsigned int w, unsigned int h, unsigned int b)
reserve memory for the image
Definition: Image.h:98

detail::CandidateParam::scale
float scale
detection scale. Multiplication factor to convert from (x,y) and size to box coordinates ...
Definition: Candidate.h:35