00001 /*!@file HMAX/test-hmax5.C Test Hmax class and compare to original code */ 00002 00003 // //////////////////////////////////////////////////////////////////// // 00004 // The iLab Neuromorphic Vision C++ Toolkit - Copyright (C) 2001 by the // 00005 // University of Southern California (USC) and the iLab at USC. // 00006 // See http://iLab.usc.edu for information about this project. // 00007 // //////////////////////////////////////////////////////////////////// // 00008 // Major portions of the iLab Neuromorphic Vision Toolkit are protected // 00009 // under the U.S. patent ``Computation of Intrinsic Perceptual Saliency // 00010 // in Visual Environments, and Applications'' by Christof Koch and // 00011 // Laurent Itti, California Institute of Technology, 2001 (patent // 00012 // pending; application number 09/912,225 filed July 23, 2001; see // 00013 // http://pair.uspto.gov/cgi-bin/final/home.pl for current status). // 00014 // //////////////////////////////////////////////////////////////////// // 00015 // This file is part of the iLab Neuromorphic Vision C++ Toolkit. // 00016 // // 00017 // The iLab Neuromorphic Vision C++ Toolkit is free software; you can // 00018 // redistribute it and/or modify it under the terms of the GNU General // 00019 // Public License as published by the Free Software Foundation; either // 00020 // version 2 of the License, or (at your option) any later version. // 00021 // // 00022 // The iLab Neuromorphic Vision C++ Toolkit is distributed in the hope // 00023 // that it will be useful, but WITHOUT ANY WARRANTY; without even the // 00024 // implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR // 00025 // PURPOSE. See the GNU General Public License for more details. // 00026 // // 00027 // You should have received a copy of the GNU General Public License // 00028 // along with the iLab Neuromorphic Vision C++ Toolkit; if not, write // 00029 // to the Free Software Foundation, Inc., 59 Temple Place, Suite 330, // 00030 // Boston, MA 02111-1307 USA. // 00031 // //////////////////////////////////////////////////////////////////// // 00032 // 00033 // Primary maintainer for this file: Dan Parks <danielfp@usc.edu> 00034 // $HeadURL: svn://isvn.usc.edu/software/invt/trunk/saliency/src/CUDA/runcudahmaxfl.C $ 00035 // $Id: runcudahmaxfl.C 12962 2010-03-06 02:13:53Z irock $ 00036 // 00037 00038 #include "Component/ModelManager.H" 00039 #include "GUI/XWindow.H" 00040 #include "CUDA/CudaHmaxFL.H" 00041 #include "CUDA/CudaHmax.H" 00042 #include "Image/Image.H" 00043 #include "Image/ColorOps.H" 00044 #include "Image/CutPaste.H" 00045 #include "Image/Rectangle.H" 00046 #include "Image/MathOps.H" 00047 #include "Image/MatrixOps.H" 00048 #include "Image/Transforms.H" 00049 #include "Image/Convolutions.H" 00050 #include "Learn/svm.h" 00051 #include "Media/FrameSeries.H" 00052 #include "nub/ref.h" 00053 #include "Raster/GenericFrame.H" 00054 #include "Raster/Raster.H" 00055 #include "Util/Types.H" 00056 #include "Util/log.H" 00057 00058 #include <fstream> 00059 #include <iostream> 00060 #include <iomanip> 00061 #include <string> 00062 #include <unistd.h> 00063 #include <cstdlib> 00064 00065 00066 // number of orientations to use in HmaxFL 00067 #define NORI 4 00068 #define NUM_PATCHES_PER_SIZE 250 00069 00070 int main(const int argc, const char **argv) 00071 { 00072 00073 MYLOGVERB = LOG_INFO; 00074 00075 ModelManager *mgr = new ModelManager("Test Hmax with Feature Learning"); 00076 00077 00078 mgr->exportOptions(MC_RECURSE); 00079 00080 // required arguments 00081 // <c1patchesDir> <dir|list> <id> <outputfile> 00082 // 00083 // <id> is the given id for the given set of images 00084 // --in only needs to happen if we are loading the patches 00085 00086 if (mgr->parseCommandLine( 00087 (const int)argc, (const char**)argv, "<cudadev> <c1patchesDir> <dir|list:images> <id> <outputfile>", 5, 5) == false) 00088 return 1; 00089 00090 std::string loadImagesOption = mgr->getExtraArg(1); 00091 std::string c1PatchesBaseDir; 00092 std::string images,idArg,devArg; 00093 std::string c2FileName; 00094 00095 std::string trainPosName; // Directory where positive images are 00096 00097 int id; 00098 00099 devArg = mgr->getExtraArg(0); 00100 c1PatchesBaseDir = mgr->getExtraArg(1); 00101 images = mgr->getExtraArg(2); 00102 idArg = mgr->getExtraArg(3); 00103 c2FileName = mgr->getExtraArg(4); 00104 00105 MemoryPolicy mp = GLOBAL_DEVICE_MEMORY; 00106 int dev = strtol(devArg.c_str(),NULL,0); 00107 std::string::size_type dirArg=images.find("dir:",0); 00108 std::string::size_type listArg=images.find("list:",0); 00109 if((dirArg == std::string::npos && 00110 listArg == std::string::npos) || 00111 (dirArg != 0 && listArg != 0)){ 00112 LFATAL("images argument is in one of the following formats - dir:<DIRNAME> or list:<LISTOFIMAGEPATHSFILE>"); 00113 return EXIT_FAILURE; 00114 } 00115 if(dirArg == 0) 00116 images = images.substr(4); 00117 else 00118 images = images.substr(5); 00119 00120 id = strtol(idArg.c_str(),NULL,0); 00121 00122 00123 // get an HmaxFL object: 00124 std::vector<int> scss(9); 00125 scss[0] = 1; scss[1] = 3; scss[2] = 5; scss[3] = 7; scss[4] = 9; 00126 scss[5] = 11; scss[6] = 13; scss[7] = 15; scss[8] = 17; 00127 std::vector<int> spss(8); 00128 spss[0] = 8; spss[1] = 10; spss[2] = 12; spss[3] = 14; 00129 spss[4] = 16; spss[5] = 18; spss[6] = 20; spss[7] = 22; 00130 // std::vector<int> scss(4); 00131 // scss[0] = 3; scss[1] = 7; scss[2] = 11; scss[3] = 15; 00132 // std::vector<int> spss(4); 00133 // spss[0] = 10; spss[1] = 14; spss[2] = 18; spss[3] = 22; 00134 00135 CudaHmaxFL hmax(mp,dev,NORI, spss, scss); 00136 00137 00138 00139 00140 // 00141 hmax.readInC1Patches(c1PatchesBaseDir); 00142 // Now we run if needed 00143 mgr->start(); 00144 00145 std::vector<std::string> imageNames; 00146 if(dirArg == 0) 00147 imageNames = hmax.readDir(images); 00148 else 00149 imageNames = hmax.readList(images); 00150 00151 std::ofstream c2File; 00152 c2File.open(c2FileName.c_str(),std::ios::out); 00153 00154 std::vector<int> patchSizes = hmax.getC1PatchSizes(); 00155 float **c2Res = new float*[patchSizes.size()]; 00156 for(unsigned int i=0;i<patchSizes.size();i++) { 00157 c2Res[i] = new float[NUM_PATCHES_PER_SIZE]; 00158 } 00159 00160 for(unsigned int imgInd=0;imgInd<imageNames.size();imgInd++){ 00161 Image<float> inputf = Raster::ReadGrayNTSC(imageNames[imgInd]); 00162 00163 // Output the c2 responses per patch into a libsvm 00164 // (or equivalently osusvm) style format 00165 00166 //hmax.printCorners("inputf",inputf,1); 00167 hmax.getC2(CudaImage<float>(inputf,mp,dev),c2Res); 00168 std::cout <<"C2 Processing Complete: " << imgInd << std::endl; 00169 if (c2File.is_open()) { 00170 c2File << id << " "; 00171 for(unsigned int i=0;i<patchSizes.size();i++) { 00172 for(int j=0;j<NUM_PATCHES_PER_SIZE;j++) { 00173 c2File << std::setiosflags(std::ios::fixed) << std::setprecision(4) << 00174 (i*NUM_PATCHES_PER_SIZE+j+1) << ":" << c2Res[i][j] << " "; 00175 } 00176 } 00177 c2File << std::endl; 00178 } 00179 std::cout <<"C2 Output Written: " << imgInd << std::endl; 00180 } 00181 00182 for(unsigned int i=0;i<patchSizes.size();i++) { 00183 delete[] c2Res[i]; 00184 } 00185 delete [] c2Res; 00186 00187 c2File.close(); 00188 return 0; 00189 } 00190 00191 00192 // ###################################################################### 00193 /* So things look consistent in everyone's emacs... */ 00194 /* Local Variables: */ 00195 /* indent-tabs-mode: nil */ 00196 /* End: */