Hmax.H

Go to the documentation of this file.
00001 /*!@file HMAX/Hmax.H Riesenhuber & Poggio's HMAX model for object recognition */
00002 
00003 // //////////////////////////////////////////////////////////////////// //
00004 // The iLab Neuromorphic Vision C++ Toolkit - Copyright (C) 2001 by the //
00005 // University of Southern California (USC) and the iLab at USC.         //
00006 // See http://iLab.usc.edu for information about this project.          //
00007 // //////////////////////////////////////////////////////////////////// //
00008 // Major portions of the iLab Neuromorphic Vision Toolkit are protected //
00009 // under the U.S. patent ``Computation of Intrinsic Perceptual Saliency //
00010 // in Visual Environments, and Applications'' by Christof Koch and      //
00011 // Laurent Itti, California Institute of Technology, 2001 (patent       //
00012 // pending; application number 09/912,225 filed July 23, 2001; see      //
00013 // http://pair.uspto.gov/cgi-bin/final/home.pl for current status).     //
00014 // //////////////////////////////////////////////////////////////////// //
00015 // This file is part of the iLab Neuromorphic Vision C++ Toolkit.       //
00016 //                                                                      //
00017 // The iLab Neuromorphic Vision C++ Toolkit is free software; you can   //
00018 // redistribute it and/or modify it under the terms of the GNU General  //
00019 // Public License as published by the Free Software Foundation; either  //
00020 // version 2 of the License, or (at your option) any later version.     //
00021 //                                                                      //
00022 // The iLab Neuromorphic Vision C++ Toolkit is distributed in the hope  //
00023 // that it will be useful, but WITHOUT ANY WARRANTY; without even the   //
00024 // implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR      //
00025 // PURPOSE.  See the GNU General Public License for more details.       //
00026 //                                                                      //
00027 // You should have received a copy of the GNU General Public License    //
00028 // along with the iLab Neuromorphic Vision C++ Toolkit; if not, write   //
00029 // to the Free Software Foundation, Inc., 59 Temple Place, Suite 330,   //
00030 // Boston, MA 02111-1307 USA.                                           //
00031 // //////////////////////////////////////////////////////////////////// //
00032 //
00033 // Primary maintainer for this file: Laurent Itti <itti@usc.edu>
00034 // $HeadURL: svn://isvn.usc.edu/software/invt/trunk/saliency/src/HMAX/Hmax.H $
00035 // $Id: Hmax.H 14139 2010-10-16 02:11:21Z dparks $
00036 //
00037 
00038 #ifndef HMAX_H_DEFINED
00039 #define HMAX_H_DEFINED
00040 
00041 #include "Image/Image.H"
00042 #include <vector>
00043 
00044 #include <cmath>
00045 #include <string>
00046 #include <vector>
00047 #include <dirent.h>
00048 
00049 //! Object recognition model inspired by Riesenhuber & Poggio's HMAX model
00050 /*! See Riesenhuber & Poggio, Nature Neuroscience, 1999.

          The public interface exposes the C1 stage (getC1()) and the C2 stage
          (getC2(), origGetC2()) separately, plus a few file/debug helpers.

          NOTE(review): this class declares a destructor and holds a raw
          pointer-to-pointer member (filter), but declares no copy constructor
          or assignment operator, so copies use the compiler-generated members.
          Confirm against Hmax.C whether copying an Hmax object is safe.
00051  */
00052 
00053 class Hmax {
00054 public:
00055   //! Default constructor. Need to call init() later.
00056   Hmax();
00057 
00058   //! Constructor
        /*! Takes the same first seven arguments (with the same defaults) as
            init(), followed by four arguments with the same names and types as
            those of initFilters(); presumably it forwards to both -- confirm
            in Hmax.C.
            @param nori      number of orientations (presumably stored in no)
            @param spacess   presumably stored in spaceSS -- TODO confirm
            @param scaless   presumably stored in scaleSS -- TODO confirm
            @param c1spaceol presumably the spatial overlap in C1 cells
                             (c1SpaceOL); defaults to 2
            @param angleflag presumably angleFlag (normalize convolution by
                             image energy if true); defaults to true
            @param s2t       presumably s2Target (center of S2 target);
                             defaults to 1.0F
            @param s2s       presumably s2Sigma (size of S2 target);
                             defaults to 1.0F
            @param stdmin    see initFilters(); defaults to 1.75F
            @param stdstep   see initFilters(); defaults to 0.5F
            @param fsmin     see initFilters(); defaults to 3
            @param fsstep    see initFilters(); defaults to 1 */
00059   Hmax(const int nori, const std::vector<int>& spacess,
00060        const std::vector<int>& scaless, const int c1spaceol = 2,
00061        const bool angleflag = true, const float s2t = 1.0F,
00062        const float s2s = 1.0F, const float stdmin = 1.75F,
00063        const float stdstep = 0.5F, const int fsmin = 3, const int fsstep = 1);
00064 
00065   //! Initialization
        /*! Same arguments and defaults as the first seven arguments of the
            full constructor. Unlike that constructor it takes no filter
            parameters (stdmin, stdstep, fsmin, fsstep).
            NOTE(review): whether initFilters() must be called separately
            after init() cannot be told from this header -- confirm. */
00066   void init(const int nori, const std::vector<int>& spacess,
00067             const std::vector<int>& scaless, const int c1spaceol = 2,
00068             const bool angleflag = true, const float s2t = 1.0F,
00069             const float s2s = 1.0F);
00070 
        //! Initialize the low-level filters (no default arguments here)
        /*! NOTE(review): parameter meanings are not documented in this
            header; the names suggest a minimum and step for the filter
            standard deviation (stdmin, stdstep) and for the filter size
            (fsmin, fsstep) -- confirm in Hmax.C. */
00071   void initFilters(const float stdmin, const float stdstep, const int fsmin, const int fsstep);
00072 
00073 
00074   //! Free internal memory
00075   void freeMem();
00076 
00077   //! Destructor
00078   ~Hmax();
00079 
00080   //! Utility operation: read a directory and return the list of files
00081   std::vector<std::string> readDir(std::string dirName);
        //! NOTE(review): undocumented; presumably reads a list of entries from
        //! the file named inName and returns them -- confirm in Hmax.C
00082   std::vector<std::string> readList(std::string inName);
00083   //! This is the code of Max Riesenhuber almost straight out of the box
00084   Image<float> origGetC2(const Image<float>& imag);
00085 
00086   //! Compute C2 responses from an input image
00087   Image<float> getC2(const Image<float>& input);
        //! NOTE(review): presumably returns the number of orientations (no)
00088   int getNumOrientations();
        //! NOTE(review): presumably sets up the c1Res array later filled by
        //! getC1(); the pointer is passed by reference -- confirm ownership
00089   void initC1(Image<float> **&c1Res);
        //! NOTE(review): presumably the counterpart of initC1() that releases
        //! c1Res -- confirm in Hmax.C
00090   void clearC1(Image<float> **&c1Res);
        //! NOTE(review): looks like a debugging helper for image im, labelled
        //! with name and gated by cond -- confirm
00091   void printCorners(const char name[], const Image<float>& im, bool cond);
        //! NOTE(review): presumably writes im to the file named fName; fName
        //! is taken by non-const reference -- confirm whether it is modified
00092   void writeOutImage(const Image<float>& im,std::string & fName);
00093   //! Calculate just the C1 level (must be public if you need to learn patches)
00094   void getC1(const Image<float>& input, Image<float>**& c1Res);
        //! Filter image into newImage (output parameter), support given by a radius
        /*! NOTE(review): the exact filter semantics are not visible here. */
00095   void sumFilter(const Image<float>& image, const float radius, Image<float>& newImage);
        //! Overload of sumFilter() taking the support as a Rectangle
00096   void sumFilter(const Image<float>& image, const Rectangle& support, Image<float>& newImage);
00097 
00098 protected:
00099   bool initialized; //!< keep track of whether we have allocated some memory
00100   int nsb; //!< number of scale bands
00101   int ns;  //!< number of scales
00102   int no;  //!< number of orientations
00103   Image<float> **filter; //!< low-level processing filters [ns][no]
00104 
00105   int c1SpaceOL;  //!< spatial overlap in C1 cells
00106   bool angleFlag; //!< normalize convolution by image energy if true
00107   float s2Target; //!< center of S2 target
00108   float s2Sigma;  //!< size of S2 target
00109 
00110   std::vector<int> spaceSS; //!< presumably the spacess argument of init() -- TODO confirm
00111   std::vector<int> scaleSS; //!< presumably the scaless argument of init() -- TODO confirm
00112 };
00113 
00114 #endif
00115 
00116 // ######################################################################
00117 /* So things look consistent in everyone's emacs... */
00118 /* Local Variables: */
00119 /* indent-tabs-mode: nil */
00120 /* End: */