00001
00002
00003
00004
00005
00006
00007
00008
00009
00010
00011
00012
00013
00014
00015
00016
00017
00018
00019
00020
00021
00022
00023
00024
00025
00026
00027
00028
00029
00030
00031
00032
00033
00034
00035
00036
00037
00038
00039
00040
00041
00042
00043
00044
00045
00046 #include "Channels/ChannelOpts.H"
00047 #include "Component/GlobalOpts.H"
00048 #include "Component/ModelManager.H"
00049 #include "Component/ModelOptionDef.H"
00050 #include "Devices/FrameGrabberConfigurator.H"
00051 #include "GUI/XWinManaged.H"
00052 #include "Gist/FFN.H"
00053 #include "Gist/trainUtils.H"
00054 #include "Image/ColorOps.H"
00055 #include "Image/CutPaste.H"
00056 #include "Image/DrawOps.H"
00057 #include "Image/ImageCache.H"
00058 #include "Image/MathOps.H"
00059 #include "Image/MatrixOps.H"
00060 #include "Image/Pixels.H"
00061 #include "Image/Transforms.H"
00062 #include "Media/MPEGStream.H"
00063 #include "Media/MediaOpts.H"
00064 #include "Media/MediaSimEvents.H"
00065 #include "Neuro/GistEstimatorStd.H"
00066 #include "Neuro/NeuroOpts.H"
00067 #include "Neuro/NeuroSimEvents.H"
00068 #include "Neuro/ShapeEstimator.H"
00069 #include "Neuro/ShapeEstimatorModes.H"
00070 #include "Neuro/SpatialMetrics.H"
00071 #include "Neuro/StdBrain.H"
00072 #include "Neuro/gistParams.H"
00073 #include "Raster/Raster.H"
00074 #include "SIFT/Histogram.H"
00075 #include "Transport/FrameIstream.H"
00076 #include "Util/Timer.H"
00077 #include "Beobot/GridMap.H"
00078
00079 #include "Simulation/SimEventQueueConfigurator.H"
00080
00081
00082 #define W_ASPECT_RATIO 320 // ideal minimum width for display
00083 #define H_ASPECT_RATIO 240 // ideal minimum height for display
00084
00085 CloseButtonListener wList;
00086 XWinManaged *inputWin;
00087 XWinManaged *salWin;
00088
00089 XWinManaged *dispWin;
00090 int wDisp, hDisp, sDisp, scaleDisp;
00091 int wDispWin, hDispWin;
00092
00093
00094 int pcaW = 16, pcaH = 5;
00095 int winBarW = 5, winBarH = 25;
00096
00097
00098 void setupDispWin(int w, int h);
00099
00100 Image< PixRGB<byte> > getDispImg
00101 (Image< PixRGB<byte> > img, Image<float> gistImg,
00102 Image<float> gistPcaImg, Image<float> outHistImg);
00103
00104
00105
00106 int main(const int argc, const char **argv)
00107 {
00108 MYLOGVERB = LOG_INFO;
00109
00110
00111 ModelManager manager("Beobot: Navigation Model");
00112
00113
00114
00115 manager.allowOptions(OPTEXP_ALL & (~OPTEXP_SAVE));
00116
00117
00118 nub::soft_ref<SimEventQueueConfigurator>
00119 seqc(new SimEventQueueConfigurator(manager));
00120 manager.addSubComponent(seqc);
00121
00122 nub::soft_ref<FrameGrabberConfigurator>
00123 gbc(new FrameGrabberConfigurator(manager));
00124 manager.addSubComponent(gbc);
00125
00126 nub::soft_ref<StdBrain> brain(new StdBrain(manager));
00127 manager.addSubComponent(brain);
00128
00129 nub::ref<SpatialMetrics> metrics(new SpatialMetrics(manager));
00130 manager.addSubComponent(metrics);
00131
00132 manager.exportOptions(MC_RECURSE);
00133 metrics->setFOAradius(30);
00134 metrics->setFoveaRadius(30);
00135 manager.setOptionValString(&OPT_MaxNormType, "FancyOne");
00136 manager.setOptionValString(&OPT_UseRandom, "false");
00137
00138
00139 manager.setOptionValString(&OPT_ShapeEstimatorMode, "FeatureMap");
00140 manager.setOptionValString(&OPT_ShapeEstimatorSmoothMethod, "Chamfer");
00141
00142 manager.setOptionValString(&OPT_RawVisualCortexChans,"OIC");
00143
00144 manager.setOptionValString(&OPT_IORtype, "Disc");
00145
00146
00147 manager.setOptionValString(&OPT_GistEstimatorType,"Std");
00148
00149
00150 REQUEST_OPTIONALIAS_NEURO(manager);
00151
00152
00153 if (manager.parseCommandLine(argc, argv, "<input_train.txt>",
00154 1, 1) == false)
00155 return(1);
00156
00157
00158 nub::soft_ref<FrameIstream> gb = gbc->getFrameGrabber();
00159 if (gb.isInvalid())
00160 LFATAL("You need to select a frame grabber type via the "
00161 "--fg-type=XX command-line option for this program "
00162 "to be useful -- ABORT");
00163 int w = gb->getWidth(), h = gb->getHeight();
00164 std::string dims = convertToString(Dims(w, h));
00165 manager.setOptionValString(&OPT_InputFrameDims, dims);
00166 nub::soft_ref<SimEventQueue> seq = seqc->getQ();
00167
00168
00169 double fdelay = 33.3667/1000.0;
00170
00171
00172 manager.start();
00173
00174
00175 SimTime prevstime = SimTime::ZERO();
00176 int fNum = 0;
00177 Image< PixRGB<byte> > inputImg;
00178 Image< PixRGB<byte> > dispImg;
00179 Image< PixRGB<byte> > tImg;
00180
00181
00182
00183 rutz::shared_ptr<FeedForwardNetwork> ffn_place(new FeedForwardNetwork());
00184 FFNtrainInfo pcInfo(manager.getExtraArg(0).c_str());
00185 ffn_place->init3L(pcInfo.h1Name, pcInfo.h2Name, pcInfo.oName,
00186 pcInfo.redFeatSize, pcInfo.h1size, pcInfo.h2size,
00187 pcInfo.nOutput, 0.0, 0.0);
00188
00189
00190 Image<double> pcaVec =
00191 setupPcaIcaMatrix(pcInfo.trainFolder+pcInfo.evecFname,
00192 pcInfo.oriFeatSize, pcInfo.redFeatSize);
00193
00194
00195 gb->startStream();
00196
00197
00198 while(1)
00199 {
00200
00201
00202 if (fNum == 0 ||
00203 ((seq->now() - 0.5 * (prevstime - seq->now())).secs() - fNum * fdelay
00204 > fdelay))
00205 {
00206
00207
00208
00209
00210 inputImg = gb->readRGB();
00211 tImg = inputImg;
00212
00213
00214
00215 if (fNum == 0) setupDispWin(w, h);
00216
00217
00218
00219 seq->post(rutz::make_shared(new SimEventInputFrame(brain.get(), GenericFrame(inputImg), 0)));
00220 LINFO("\nnew frame :%d",fNum);
00221
00222
00223 Image<double> cgist;
00224 if (SeC<SimEventGistOutput> ee = seq->check<SimEventGistOutput>(brain.get())) cgist = ee->gv();
00225 else LFATAL("No gist output in the queue");
00226
00227
00228 Image<double> in;
00229 if(pcInfo.isPCA) in = matrixMult(pcaVec, cgist);
00230 else in = cgist;
00231
00232
00233 ffn_place->run3L(in);
00234 rutz::shared_ptr<Histogram> resHist(new Histogram(pcInfo.nOutput));
00235
00236 for(uint i = 0; i < pcInfo.nOutput; i++)
00237 {
00238 LINFO("pl[%3d]: %.4f",i,ffn_place->getOutput().getVal(i));
00239 resHist->addValue(i,ffn_place->getOutput().getVal(i));
00240 }
00241
00242
00243 LFATAL("FIXME SimEventGistOutput does not contain an image and should be updated");
00244
00245
00246
00247
00248
00249
00250
00251
00252
00253 dispWin->drawImage(dispImg,0,0);
00254 Raster::waitForKey();
00255
00256
00257
00258
00259
00260
00261
00262
00263
00264
00265
00266 fNum++;
00267 }
00268
00269
00270 prevstime = seq->now();
00271 const SimStatus status = seq->evolve();
00272
00273
00274 if (SeC<SimEventWTAwinner> e = seq->check<SimEventWTAwinner>(0))
00275 {
00276 const Point2D<int> winner = e->winner().p;
00277
00278
00279 Image<float> fmask; std::string label;
00280 if (SeC<SimEventShapeEstimatorOutput>
00281 e = seq->check<SimEventShapeEstimatorOutput>(0))
00282 { fmask = e->smoothMask(); label = e->winningLabel(); }
00283
00284 Image<float> roiImg;
00285 if (fmask.initialized())
00286 roiImg = fmask * luminance(inputImg);
00287 else
00288 roiImg = luminance(inputImg);
00289
00290 drawCircle(roiImg, winner, 10, 0.0f, 1);
00291 LINFO("\nFrame: %d, winner: (%d,%d) in %s\n\n",
00292 fNum, winner.i, winner.j, label.c_str());
00293
00294
00295
00296 }
00297
00298 if (SIM_BREAK == status)
00299 break;
00300 }
00301
00302
00303 manager.stop();
00304
00305
00306 return 0;
00307 }
00308
00309
00310
00311 void setupDispWin(int w, int h)
00312 {
00313
00314
00315
00316
00317 scaleDisp = 1;
00318 while (w*scaleDisp < W_ASPECT_RATIO*.75 && h*scaleDisp < H_ASPECT_RATIO*.75)
00319 scaleDisp++;
00320
00321
00322
00323 wDisp = w*scaleDisp; hDisp = h*scaleDisp;
00324 if(wDisp/(0.0 + W_ASPECT_RATIO) > hDisp/(0.0 + H_ASPECT_RATIO))
00325 hDisp = (int)(wDisp / (0.0 + W_ASPECT_RATIO) * H_ASPECT_RATIO)+1;
00326 else
00327 wDisp = (int)(hDisp / (0.0 + H_ASPECT_RATIO) * W_ASPECT_RATIO)+1;
00328
00329
00330 sDisp = (hDisp/NUM_GIST_FEAT + 1);
00331 hDisp = sDisp * NUM_GIST_FEAT;
00332
00333
00334 wDispWin = wDisp + sDisp * NUM_GIST_COL;
00335 hDispWin = hDisp + sDisp * pcaH * 2;
00336
00337 dispWin = new XWinManaged(Dims(wDispWin, hDispWin), 0, 0, "dispImg");
00338 wList.add(dispWin);
00339
00340 inputWin = new XWinManaged(Dims(w, h), w, 0, "input" );
00341 wList.add(inputWin);
00342
00343 salWin = new XWinManaged(Dims(w, h), 2*w, 0, "Sal" );
00344 wList.add(salWin);
00345 }
00346
00347
00348
00349 Image< PixRGB<byte> > getDispImg (Image< PixRGB<byte> > img,
00350 Image<float> gistImg,
00351 Image<float> gistPcaImg,
00352 Image<float> outHistImg)
00353 {
00354 Image< PixRGB<byte> > dispImg(wDispWin, hDispWin, ZEROS);
00355 int w = img.getWidth(); int h = img.getHeight();
00356
00357
00358 drawGrid(img, w/4,h/4,1,1,PixRGB<byte>(255,255,255));
00359 inplacePaste(dispImg, img, Point2D<int>(0, 0));
00360
00361
00362 inplaceNormalize(gistImg, 0.0f, 255.0f);
00363 inplacePaste(dispImg, Image<PixRGB<byte> >(gistImg), Point2D<int>(wDisp, 0));
00364
00365
00366 inplaceNormalize(gistPcaImg, 0.0f, 255.0f);
00367 inplacePaste(dispImg, Image<PixRGB<byte> >(gistPcaImg), Point2D<int>(wDisp, hDisp));
00368
00369
00370 inplaceNormalize(outHistImg, 0.0f, 255.0f);
00371 inplacePaste(dispImg, Image<PixRGB<byte> >(outHistImg), Point2D<int>(0, hDisp));
00372
00373
00374 drawLine(dispImg, Point2D<int>(0,hDisp),
00375 Point2D<int>(wDispWin,hDisp),
00376 PixRGB<byte>(255,255,255),1);
00377 drawLine(dispImg, Point2D<int>(wDisp-1,0),
00378 Point2D<int>(wDisp-1,hDispWin-1),
00379 PixRGB<byte>(255,255,255),1);
00380 return dispImg;
00381 }
00382
00383
00384
00385
00386
00387