00001 /*!@file INVT/neovision2.C CUDA-accelerated Neovision2 integrated demo */ 00002 00003 // //////////////////////////////////////////////////////////////////// // 00004 // The iLab Neuromorphic Vision C++ Toolkit - Copyright (C) 2000-2005 // 00005 // by the University of Southern California (USC) and the iLab at USC. // 00006 // See http://iLab.usc.edu for information about this project. // 00007 // //////////////////////////////////////////////////////////////////// // 00008 // Major portions of the iLab Neuromorphic Vision Toolkit are protected // 00009 // under the U.S. patent ``Computation of Intrinsic Perceptual Saliency // 00010 // in Visual Environments, and Applications'' by Christof Koch and // 00011 // Laurent Itti, California Institute of Technology, 2001 (patent // 00012 // pending; application number 09/912,225 filed July 23, 2001; see // 00013 // http://pair.uspto.gov/cgi-bin/final/home.pl for current status). // 00014 // //////////////////////////////////////////////////////////////////// // 00015 // This file is part of the iLab Neuromorphic Vision C++ Toolkit. // 00016 // // 00017 // The iLab Neuromorphic Vision C++ Toolkit is free software; you can // 00018 // redistribute it and/or modify it under the terms of the GNU General // 00019 // Public License as published by the Free Software Foundation; either // 00020 // version 2 of the License, or (at your option) any later version. // 00021 // // 00022 // The iLab Neuromorphic Vision C++ Toolkit is distributed in the hope // 00023 // that it will be useful, but WITHOUT ANY WARRANTY; without even the // 00024 // implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR // 00025 // PURPOSE. See the GNU General Public License for more details. // 00026 // // 00027 // You should have received a copy of the GNU General Public License // 00028 // along with the iLab Neuromorphic Vision C++ Toolkit; if not, write // 00029 // to the Free Software Foundation, Inc., 59 Temple Place, Suite 330, // 00030 // Boston, MA 02111-1307 USA. // 00031 // //////////////////////////////////////////////////////////////////// // 00032 // 00033 // Primary maintainer for this file: Rob Peters <rjpeters at usc dot edu> 00034 // $HeadURL: svn://isvn.usc.edu/software/invt/trunk/saliency/src/INVT/neovision2-cuda.C $ 00035 // $Id: neovision2-cuda.C 13232 2010-04-15 02:15:06Z dparks $ 00036 // 00037 00038 #include "Component/ModelManager.H" 00039 #include "Image/ColorOps.H" 00040 #include "Image/CutPaste.H" 00041 #include "Image/DrawOps.H" 00042 #include "Image/FilterOps.H" 00043 #include "Image/Image.H" 00044 #include "Image/ImageSet.H" 00045 #include "Image/Layout.H" 00046 #include "Image/MathOps.H" 00047 #include "Image/Pixels.H" 00048 #include "Image/PyramidOps.H" 00049 #include "Image/ShapeOps.H" 00050 #include "Image/Transforms.H" 00051 #include "Media/FrameSeries.H" 00052 #include "Media/MediaOpts.H" 00053 #include "Raster/GenericFrame.H" 00054 #include "Raster/Raster.H" 00055 #include "Transport/FrameInfo.H" 00056 #include "Transport/TransportOpts.H" 00057 #include "Util/csignals.H" 00058 #include "rutz/shared_ptr.h" 00059 #include "rutz/trace.h" 00060 #include "rutz/rand.h" 00061 00062 #include "CUDA/CudaSaliency.H" 00063 00064 #include <ctype.h> 00065 #include <deque> 00066 #include <iterator> 00067 #include <limits> 00068 #include <stdlib.h> // for atoi(), malloc(), free() 00069 #include <string.h> 00070 #include <sys/resource.h> 00071 #include <signal.h> 00072 #include <time.h> 00073 #include <vector> 00074 00075 00076 00077 // ###################################################################### 00078 int submain(int argc, const char** argv) 00079 { 00080 volatile int signum = 0; 00081 signal(SIGPIPE, SIG_IGN); 00082 catchsignals(&signum); 00083 00084 // Instantiate our various ModelComponents: 00085 00086 ModelManager manager("Nv2"); 00087 00088 nub::ref<InputFrameSeries> ifs(new InputFrameSeries(manager)); 00089 manager.addSubComponent(ifs); 00090 00091 nub::ref<OutputFrameSeries> ofs(new OutputFrameSeries(manager)); 00092 manager.addSubComponent(ofs); 00093 00094 nub::ref<CudaSaliency> cus(new CudaSaliency(manager)); 00095 manager.addSubComponent(cus); 00096 00097 if (manager.parseCommandLine((const int)argc, (const char**)argv, "<sampleimagesdir>", 1, 1) == false) 00098 return 1; 00099 00100 manager.exportOptions(MC_RECURSE); 00101 00102 manager.start(); 00103 00104 std::string sampleImagesDir; 00105 00106 sampleImagesDir = manager.getExtraArg(0); 00107 00108 00109 int retval = 0; 00110 ifs->startStream(); 00111 const GenericFrameSpec fspec = ifs->peekFrameSpec(); 00112 Image<PixRGB<byte> > rgbin_last; 00113 // Randomize the seed 00114 //rutz::urand r(time((time_t*)0) + getpid()); 00115 // Don't randomize the seed, i want the same frames each time 00116 rutz::urand r(0); 00117 00118 int curPickedFrame=0; 00119 00120 while (true) 00121 { 00122 if (signum != 0) { 00123 LINFO("quitting because %s was caught", signame(signum)); 00124 retval = -1; 00125 break; 00126 } 00127 00128 if (ofs->becameVoid()) { 00129 LINFO("quitting because output stream was closed or became void"); 00130 break; 00131 } 00132 00133 // 00134 // get the next frame from our input source 00135 // 00136 const FrameState is = ifs->updateNext(); 00137 if (is == FRAME_COMPLETE) break; 00138 00139 GenericFrame input = ifs->readFrame(); 00140 if (!input.initialized()) break; 00141 00142 const Image<PixRGB<byte> > rgbin = input.asRgb(); 00143 00144 rgbin_last = rgbin; 00145 cus->doInput(rgbin); 00146 00147 00148 // Sub sample video, randomly pick roughly every N frames 00149 int willPick = r.idraw(100); 00150 00151 if(willPick==0) 00152 { 00153 //Different Maps 00154 CudaImage<float> out = cus->getCudaOutput(); 00155 00156 std::vector<Point2D<int> > loc = cus->getSalMaxLoc(); 00157 00158 int rectW = cus->getPatchSize(); 00159 int rectH = cus->getPatchSize(); 00160 00161 for(unsigned int i=0; i<loc.size(); i++) 00162 { 00163 Point2D<int> modLoc; 00164 modLoc.i = loc[i].i * rgbin.getWidth() / double(out.getWidth()); 00165 modLoc.j = loc[i].j * rgbin.getHeight() / double(out.getHeight()); 00166 00167 int fi = std::max(modLoc.i-int(rectW/2.0),0); 00168 int fj = std::max(modLoc.j-int(rectH/2.0),0); 00169 Point2D<int> p = Point2D<int>(fi,fj); 00170 Rectangle foa = Rectangle(p,Dims(rectW,rectH)); 00171 printf("FOA:<%s> ",convertToString(modLoc).c_str()); 00172 Image<PixRGB<byte> > patch = crop(rgbin,foa); 00173 Image<PixRGB<byte> > patchResize = rescale(patch, 256, 256); 00174 00175 char fname[200]; 00176 sprintf(fname,"%s/Sample-%d-%d.png",sampleImagesDir.c_str(),curPickedFrame,i); 00177 Raster::WriteRGB(patchResize,fname); 00178 00179 } 00180 printf("\n"); 00181 curPickedFrame++; 00182 } 00183 00184 } 00185 00186 manager.stop(); 00187 return retval; 00188 } 00189 00190 // ###################################################################### 00191 int main(int argc, const char** argv) 00192 { 00193 try { 00194 return submain(argc, argv); 00195 } catch (...) { 00196 REPORT_CURRENT_EXCEPTION; 00197 } 00198 } 00199 00200 // ###################################################################### 00201 /* So things look consistent in everyone's emacs... */ 00202 /* Local Variables: */ 00203 /* mode: c++ */ 00204 /* indent-tabs-mode: nil */ 00205 /* End: */