TigsInputFrame.C

Go to the documentation of this file.
00001 /*!@file TIGS/TigsInputFrame.C Class that lets us do lazy computation of luminance/rg/by from an input frame */
00002 
00003 // //////////////////////////////////////////////////////////////////// //
00004 // The iLab Neuromorphic Vision C++ Toolkit - Copyright (C) 2000-2005   //
00005 // by the University of Southern California (USC) and the iLab at USC.  //
00006 // See http://iLab.usc.edu for information about this project.          //
00007 // //////////////////////////////////////////////////////////////////// //
00008 // Major portions of the iLab Neuromorphic Vision Toolkit are protected //
00009 // under the U.S. patent ``Computation of Intrinsic Perceptual Saliency //
00010 // in Visual Environments, and Applications'' by Christof Koch and      //
00011 // Laurent Itti, California Institute of Technology, 2001 (patent       //
00012 // pending; application number 09/912,225 filed July 23, 2001; see      //
00013 // http://pair.uspto.gov/cgi-bin/final/home.pl for current status).     //
00014 // //////////////////////////////////////////////////////////////////// //
00015 // This file is part of the iLab Neuromorphic Vision C++ Toolkit.       //
00016 //                                                                      //
00017 // The iLab Neuromorphic Vision C++ Toolkit is free software; you can   //
00018 // redistribute it and/or modify it under the terms of the GNU General  //
00019 // Public License as published by the Free Software Foundation; either  //
00020 // version 2 of the License, or (at your option) any later version.     //
00021 //                                                                      //
00022 // The iLab Neuromorphic Vision C++ Toolkit is distributed in the hope  //
00023 // that it will be useful, but WITHOUT ANY WARRANTY; without even the   //
00024 // implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR      //
00025 // PURPOSE.  See the GNU General Public License for more details.       //
00026 //                                                                      //
00027 // You should have received a copy of the GNU General Public License    //
00028 // along with the iLab Neuromorphic Vision C++ Toolkit; if not, write   //
00029 // to the Free Software Foundation, Inc., 59 Temple Place, Suite 330,   //
00030 // Boston, MA 02111-1307 USA.                                           //
00031 // //////////////////////////////////////////////////////////////////// //
00032 //
00033 // Primary maintainer for this file: Rob Peters <rjpeters at usc dot edu>
00034 // $HeadURL: svn://isvn.usc.edu/software/invt/trunk/saliency/src/TIGS/TigsInputFrame.C $
00035 // $Id: TigsInputFrame.C 8297 2007-04-25 00:26:17Z rjpeters $
00036 //
00037 
00038 #ifndef TIGS_TIGSINPUTFRAME_C_DEFINED
00039 #define TIGS_TIGSINPUTFRAME_C_DEFINED
00040 
00041 #include "TIGS/TigsInputFrame.H"
00042 
00043 #include "Image/ColorOps.H"
00044 #include "Util/StringConversions.H"
00045 #include "rutz/trace.h"
00046 
00047 #include <sstream>
00048 
00049 // specialization of rescale() for PixRGB<byte>; here we unpack the
00050 // PixRGB operations so that they can be better optimized by the
00051 // compiler for at least a 2x speedup -- unfortunately (with gcc
00052 // anyway) the overloaded PixRGB operators (i.e. PixRGB+PixRGB,
00053 // PixRGB*float, etc.) make for slow code, so here we unpack things
00054 // and do the interpolation one element at a time using builtin,
00055 // scalar arithmetic only
00056 Image<PixRGB<float> > rescaleAndPromote(const Image<PixRGB<byte> >& src,
00057                                         const int new_w, const int new_h)
00058 {
00059 GVX_TRACE(__PRETTY_FUNCTION__);
00060 
00061   ASSERT(src.initialized()); ASSERT(new_w > 0 && new_h > 0);
00062 
00063   const int orig_w = src.getWidth();
00064   const int orig_h = src.getHeight();
00065 
00066   // check if same size already
00067   if (new_w == orig_w && new_h == orig_h) return src;
00068 
00069   const float sw = float(orig_w) / float(new_w);
00070   const float sh = float(orig_h) / float(new_h);
00071 
00072   Image<PixRGB<float> > result(new_w, new_h, NO_INIT);
00073   Image<PixRGB<float> >::iterator dptr = result.beginw();
00074   Image<PixRGB<byte> >::const_iterator const sptr = src.begin();
00075 
00076   for (int j = 0; j < new_h; ++j)
00077     {
00078       const float y = std::max(0.0f, (j+0.5f) * sh - 0.5f);
00079 
00080       const int y0 = int(y);
00081       const int y1 = std::min(y0 + 1, orig_h - 1);
00082 
00083       const float fy = y - float(y0);
00084 
00085       const int wy0 = orig_w * y0;
00086       const int wy1 = orig_w * y1;
00087 
00088       for (int i = 0; i < new_w; ++i)
00089         {
00090           const float x = std::max(0.0f, (i+0.5f) * sw - 0.5f);
00091 
00092           const int x0 = int(x);
00093           const int x1 = std::min(x0 + 1, orig_w - 1);
00094 
00095           const float fx = x - float(x0);
00096 
00097 #define RGB_BILINEAR_INTERP(EL)                                 \
00098   do {                                                          \
00099     const float                                                 \
00100       d00( sptr[x0 + wy0].p[EL] ), d10( sptr[x1 + wy0].p[EL] ), \
00101       d01( sptr[x0 + wy1].p[EL] ), d11( sptr[x1 + wy1].p[EL] ); \
00102                                                                 \
00103     const float                                                 \
00104       dx0( d00 + (d10 - d00) * fx ),                            \
00105       dx1( d01 + (d11 - d01) * fx );                            \
00106                                                                 \
00107     dptr->p[EL] = float( int( dx0 + (dx1 - dx0) * fy ) );       \
00108   } while(0)
00109 
00110           // yes, I'm doing that funny float(byte()) conversion on
00111           // purpose, in order to maintain backward compatibility with
00112           // when I used to do
00113           // Image<PixRGB<float>>(rescale(byteimage))
00114 
00115           RGB_BILINEAR_INTERP(0);
00116           RGB_BILINEAR_INTERP(1);
00117           RGB_BILINEAR_INTERP(2);
00118 
00119 #undef RGB_BILINEAR_INTERP
00120 
00121           ++dptr;
00122         }
00123     }
00124   return result;
00125 }
00126 
00127 rutz::shared_ptr<TigsInputFrame>
00128 TigsInputFrame::fromGhostString(const std::string& s)
00129 {
00130   std::istringstream iss(s);
00131   int64 nanosecs;
00132   std::string dimsstr;
00133   std::string hashstr;
00134   iss >> nanosecs >> dimsstr >> hashstr;
00135 
00136   const Dims dims = fromStr<Dims>(dimsstr);
00137   const Digest<16> hash = Digest<16>::fromString(hashstr);
00138 
00139   return rutz::shared_ptr<TigsInputFrame>
00140     (new TigsInputFrame(SimTime::NSECS(nanosecs), dims, hash));
00141 }
00142 
00143 std::string TigsInputFrame::toGhostString() const
00144 {
00145   std::ostringstream oss;
00146   oss << itsTime.nsecs()
00147       << ' ' << convertToString(itsOrigbounds.dims())
00148       << ' ' << this->getHash().asString();
00149   return oss.str();
00150 }
00151 
00152 void TigsInputFrame::initialize() const
00153 {
00154   if (itsLum.initialized()
00155       && itsRG.initialized()
00156       && itsBY.initialized()
00157       && itsRGB.initialized())
00158     return;
00159 
00160   GVX_TRACE(__PRETTY_FUNCTION__);
00161 
00162   const Image<PixRGB<float> > fframe =
00163     rescaleAndPromote(itsOrigframe, 512, 512);
00164 
00165   itsRGB = Image<PixRGB<byte> >(fframe);
00166 
00167   itsLum = luminance(fframe);
00168 
00169   getRGBYsimple(fframe, itsRG, itsBY, float(5.0f));
00170 
00171   {GVX_TRACE("re-range");
00172   itsRG += 1.0f;
00173   itsBY += 1.0f;
00174   itsRG *= 127.5f;
00175   itsBY *= 127.5f;
00176   }
00177 }
00178 
00179 // ######################################################################
00180 /* So things look consistent in everyone's emacs... */
00181 /* Local Variables: */
00182 /* mode: c++ */
00183 /* indent-tabs-mode: nil */
00184 /* End: */
00185 
00186 #endif // TIGS_TIGSINPUTFRAME_C_DEFINED