runcudahmaxfl.C

00001 /*!@file CUDA/runcudahmaxfl.C Compute CUDA HmaxFL C2 responses for a set of images and write them in libsvm format */
00002 
00003 // //////////////////////////////////////////////////////////////////// //
00004 // The iLab Neuromorphic Vision C++ Toolkit - Copyright (C) 2001 by the //
00005 // University of Southern California (USC) and the iLab at USC.         //
00006 // See http://iLab.usc.edu for information about this project.          //
00007 // //////////////////////////////////////////////////////////////////// //
00008 // Major portions of the iLab Neuromorphic Vision Toolkit are protected //
00009 // under the U.S. patent ``Computation of Intrinsic Perceptual Saliency //
00010 // in Visual Environments, and Applications'' by Christof Koch and      //
00011 // Laurent Itti, California Institute of Technology, 2001 (patent       //
00012 // pending; application number 09/912,225 filed July 23, 2001; see      //
00013 // http://pair.uspto.gov/cgi-bin/final/home.pl for current status).     //
00014 // //////////////////////////////////////////////////////////////////// //
00015 // This file is part of the iLab Neuromorphic Vision C++ Toolkit.       //
00016 //                                                                      //
00017 // The iLab Neuromorphic Vision C++ Toolkit is free software; you can   //
00018 // redistribute it and/or modify it under the terms of the GNU General  //
00019 // Public License as published by the Free Software Foundation; either  //
00020 // version 2 of the License, or (at your option) any later version.     //
00021 //                                                                      //
00022 // The iLab Neuromorphic Vision C++ Toolkit is distributed in the hope  //
00023 // that it will be useful, but WITHOUT ANY WARRANTY; without even the   //
00024 // implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR      //
00025 // PURPOSE.  See the GNU General Public License for more details.       //
00026 //                                                                      //
00027 // You should have received a copy of the GNU General Public License    //
00028 // along with the iLab Neuromorphic Vision C++ Toolkit; if not, write   //
00029 // to the Free Software Foundation, Inc., 59 Temple Place, Suite 330,   //
00030 // Boston, MA 02111-1307 USA.                                           //
00031 // //////////////////////////////////////////////////////////////////// //
00032 //
00033 // Primary maintainer for this file: Dan Parks <danielfp@usc.edu>
00034 // $HeadURL: svn://isvn.usc.edu/software/invt/trunk/saliency/src/CUDA/runcudahmaxfl.C $
00035 // $Id: runcudahmaxfl.C 12962 2010-03-06 02:13:53Z irock $
00036 //
00037 
00038 #include "Component/ModelManager.H"
00039 #include "GUI/XWindow.H"
00040 #include "CUDA/CudaHmaxFL.H"
00041 #include "CUDA/CudaHmax.H"
00042 #include "Image/Image.H"
00043 #include "Image/ColorOps.H"
00044 #include "Image/CutPaste.H"
00045 #include "Image/Rectangle.H"
00046 #include "Image/MathOps.H"
00047 #include "Image/MatrixOps.H"
00048 #include "Image/Transforms.H"
00049 #include "Image/Convolutions.H"
00050 #include "Learn/svm.h"
00051 #include "Media/FrameSeries.H"
00052 #include "nub/ref.h"
00053 #include "Raster/GenericFrame.H"
00054 #include "Raster/Raster.H"
00055 #include "Util/Types.H"
00056 #include "Util/log.H"
00057 
00058 #include <fstream>
00059 #include <iostream>
00060 #include <iomanip>
00061 #include <string>
00062 #include <unistd.h>
00063 #include <cstdlib>
00064 
00065 
// Number of orientations handed to the CudaHmaxFL constructor in main().
static const int NORI = 4;

// Number of C2 responses stored and written out per C1 patch size; main()
// sizes every per-patch-size response buffer with this value.
static const int NUM_PATCHES_PER_SIZE = 250;
00069 
00070 int main(const int argc, const char **argv)
00071 {
00072 
00073   MYLOGVERB = LOG_INFO;
00074 
00075   ModelManager *mgr = new ModelManager("Test Hmax with Feature Learning");
00076 
00077 
00078   mgr->exportOptions(MC_RECURSE);
00079 
00080   // required arguments
00081   // <c1patchesDir> <dir|list> <id> <outputfile>
00082   //
00083   // <id> is the given id for the given set of images
00084   // --in only needs to happen if we are loading the patches
00085 
00086   if (mgr->parseCommandLine(
00087                             (const int)argc, (const char**)argv, "<cudadev> <c1patchesDir> <dir|list:images> <id> <outputfile>", 5, 5) == false)
00088     return 1;
00089 
00090   std::string loadImagesOption = mgr->getExtraArg(1);
00091   std::string c1PatchesBaseDir;
00092   std::string images,idArg,devArg;
00093   std::string c2FileName;
00094 
00095   std::string trainPosName; // Directory where positive images are
00096 
00097   int id;
00098 
00099   devArg = mgr->getExtraArg(0);
00100   c1PatchesBaseDir = mgr->getExtraArg(1);
00101   images = mgr->getExtraArg(2);
00102   idArg = mgr->getExtraArg(3);
00103   c2FileName = mgr->getExtraArg(4);
00104 
00105   MemoryPolicy mp = GLOBAL_DEVICE_MEMORY;
00106   int dev = strtol(devArg.c_str(),NULL,0);
00107   std::string::size_type dirArg=images.find("dir:",0);
00108   std::string::size_type listArg=images.find("list:",0);
00109   if((dirArg == std::string::npos &&
00110       listArg == std::string::npos) ||
00111      (dirArg != 0 && listArg != 0)){
00112     LFATAL("images argument is in one of the following formats -  dir:<DIRNAME>  or  list:<LISTOFIMAGEPATHSFILE>");
00113     return EXIT_FAILURE;
00114   }
00115   if(dirArg == 0)
00116     images = images.substr(4);
00117   else
00118     images = images.substr(5);
00119 
00120   id = strtol(idArg.c_str(),NULL,0);
00121 
00122 
00123   // get an HmaxFL object:
00124   std::vector<int> scss(9);
00125   scss[0] = 1; scss[1] = 3; scss[2] = 5; scss[3] = 7; scss[4] = 9;
00126   scss[5] = 11; scss[6] = 13; scss[7] = 15; scss[8] = 17;
00127   std::vector<int> spss(8);
00128   spss[0] = 8; spss[1] = 10; spss[2] = 12; spss[3] = 14;
00129   spss[4] = 16; spss[5] = 18; spss[6] = 20; spss[7] = 22;
00130   // std::vector<int> scss(4);
00131   // scss[0] = 3; scss[1] = 7; scss[2] = 11; scss[3] = 15;
00132   // std::vector<int> spss(4);
00133   // spss[0] = 10; spss[1] = 14; spss[2] = 18; spss[3] = 22;
00134 
00135   CudaHmaxFL hmax(mp,dev,NORI, spss, scss);
00136 
00137 
00138 
00139 
00140   //
00141   hmax.readInC1Patches(c1PatchesBaseDir);
00142   // Now we run if needed
00143   mgr->start();
00144 
00145   std::vector<std::string> imageNames;
00146   if(dirArg == 0)
00147     imageNames = hmax.readDir(images);
00148   else
00149     imageNames = hmax.readList(images);
00150 
00151   std::ofstream c2File;
00152   c2File.open(c2FileName.c_str(),std::ios::out);
00153 
00154   std::vector<int> patchSizes = hmax.getC1PatchSizes();
00155   float **c2Res = new float*[patchSizes.size()];
00156   for(unsigned int i=0;i<patchSizes.size();i++) {
00157     c2Res[i] = new float[NUM_PATCHES_PER_SIZE];
00158   }
00159 
00160   for(unsigned int imgInd=0;imgInd<imageNames.size();imgInd++){
00161     Image<float> inputf = Raster::ReadGrayNTSC(imageNames[imgInd]);
00162 
00163     // Output the c2 responses per patch into a libsvm
00164     // (or equivalently osusvm) style format
00165 
00166     //hmax.printCorners("inputf",inputf,1);
00167     hmax.getC2(CudaImage<float>(inputf,mp,dev),c2Res);
00168     std::cout <<"C2 Processing Complete: " << imgInd << std::endl;
00169     if (c2File.is_open()) {
00170       c2File << id << " ";
00171       for(unsigned int i=0;i<patchSizes.size();i++) {
00172         for(int j=0;j<NUM_PATCHES_PER_SIZE;j++) {
00173           c2File << std::setiosflags(std::ios::fixed) << std::setprecision(4) <<
00174             (i*NUM_PATCHES_PER_SIZE+j+1) << ":" << c2Res[i][j] << " ";
00175         }
00176       }
00177       c2File << std::endl;
00178     }
00179     std::cout <<"C2 Output Written: " << imgInd << std::endl;
00180   }
00181 
00182   for(unsigned int i=0;i<patchSizes.size();i++) {
00183     delete[] c2Res[i];
00184   }
00185   delete [] c2Res;
00186 
00187   c2File.close();
00188   return 0;
00189 }
00190 
00191 
00192 // ######################################################################
00193 /* So things look consistent in everyone's emacs... */
00194 /* Local Variables: */
00195 /* indent-tabs-mode: nil */
00196 /* End: */