Visual Servoing Platform version 3.7.0
Loading...
Searching...
No Matches
testGenericTrackerDepth.cpp
1/*
2 * ViSP, open source Visual Servoing Platform software.
3 * Copyright (C) 2005 - 2024 by Inria. All rights reserved.
4 *
5 * This software is free software; you can redistribute it and/or modify
6 * it under the terms of the GNU General Public License as published by
7 * the Free Software Foundation; either version 2 of the License, or
8 * (at your option) any later version.
9 * See the file LICENSE.txt at the root directory of this source
10 * distribution for additional information about the GNU GPL.
11 *
12 * For using ViSP with software that can not be combined with the GNU
13 * GPL, please contact Inria about acquiring a ViSP Professional
14 * Edition License.
15 *
16 * See https://visp.inria.fr for more information.
17 *
18 * This software was developed at:
19 * Inria Rennes - Bretagne Atlantique
20 * Campus Universitaire de Beaulieu
21 * 35042 Rennes Cedex
22 * France
23 *
24 * If you have questions regarding the use of this file, please contact
25 * Inria at visp@inria.fr
26 *
27 * This file is provided AS IS with NO WARRANTY OF ANY KIND, INCLUDING THE
28 * WARRANTY OF DESIGN, MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE.
29 *
30 * Description:
31 * Regression test for depth MBT.
32 */
33
39
40#include <cstdlib>
41#include <iostream>
42#include <visp3/core/vpConfig.h>
43
44#if defined(VISP_HAVE_MODULE_MBT) && (defined(VISP_HAVE_LAPACK) || defined(VISP_HAVE_EIGEN3) || defined(VISP_HAVE_OPENCV))
45
46#if (VISP_CXX_STANDARD >= VISP_CXX_STANDARD_11)
47#include <type_traits>
48#endif
49
50#include <visp3/core/vpIoTools.h>
51#include <visp3/gui/vpDisplayD3D.h>
52#include <visp3/gui/vpDisplayGDI.h>
53#include <visp3/gui/vpDisplayGTK.h>
54#include <visp3/gui/vpDisplayOpenCV.h>
55#include <visp3/gui/vpDisplayX.h>
56#include <visp3/io/vpImageIo.h>
57#include <visp3/io/vpParseArgv.h>
58#include <visp3/mbt/vpMbGenericTracker.h>
59
60#define GETOPTARGS "i:dcle:mCh"
61
62#ifdef ENABLE_VISP_NAMESPACE
63using namespace VISP_NAMESPACE_NAME;
64#endif
65
66namespace
67{
68void usage(const char *name, const char *badparam)
69{
70 fprintf(stdout, "\n\
71 Regression test for vpGenericTracker and depth.\n\
72 \n\
73 SYNOPSIS\n\
74 %s [-i <test image path>] [-c] [-d] [-h] [-l] \n\
75 [-e <last frame index>] [-m] [-C]\n",
76 name);
77
78 fprintf(stdout, "\n\
79 OPTIONS: \n\
80 -i <input image path> \n\
81 Set image input path.\n\
82 These images come from ViSP-images-x.y.z.tar.gz available \n\
83 on the ViSP website.\n\
84 Setting the VISP_INPUT_IMAGE_PATH environment\n\
85 variable produces the same behavior than using\n\
86 this option.\n\
87 \n\
88 -d \n\
89 Turn off the display.\n\
90 \n\
91 -c\n\
92 Disable the mouse click. Useful to automate the \n\
93 execution of this program without human intervention.\n\
94 \n\
95 -l\n\
96 Use the scanline for visibility tests.\n\
97 \n\
98 -e <last frame index>\n\
99 Specify the index of the last frame. Once reached, the tracking is stopped.\n\
100 \n\
101 -m \n\
102 Set a tracking mask.\n\
103 \n\
104 -C \n\
105 Use color images.\n\
106 \n\
107 -h \n\
108 Print the help.\n\n");
109
110 if (badparam)
111 fprintf(stdout, "\nERROR: Bad parameter [%s]\n", badparam);
112}
113
114bool getOptions(int argc, const char **argv, std::string &ipath, bool &click_allowed, bool &display, bool &useScanline,
115 int &lastFrame, bool &use_mask, bool &use_color_image)
116{
117 const char *optarg_;
118 int c;
119 while ((c = vpParseArgv::parse(argc, argv, GETOPTARGS, &optarg_)) > 1) {
120
121 switch (c) {
122 case 'i':
123 ipath = optarg_;
124 break;
125 case 'c':
126 click_allowed = false;
127 break;
128 case 'd':
129 display = false;
130 break;
131 case 'l':
132 useScanline = true;
133 break;
134 case 'e':
135 lastFrame = atoi(optarg_);
136 break;
137 case 'm':
138 use_mask = true;
139 break;
140 case 'C':
141 use_color_image = true;
142 break;
143 case 'h':
144 usage(argv[0], nullptr);
145 return false;
146
147 default:
148 usage(argv[0], optarg_);
149 return false;
150 }
151 }
152
153 if ((c == 1) || (c == -1)) {
154 // standalone param or error
155 usage(argv[0], nullptr);
156 std::cerr << "ERROR: " << std::endl;
157 std::cerr << " Bad argument " << optarg_ << std::endl << std::endl;
158 return false;
159 }
160
161 return true;
162}
163
164template <typename Type>
165bool read_data(const std::string &input_directory, int cpt, const vpCameraParameters &cam_depth, vpImage<Type> &I,
166 vpImage<uint16_t> &I_depth, std::vector<vpColVector> &pointcloud, vpHomogeneousMatrix &cMo)
167{
168#if (VISP_CXX_STANDARD >= VISP_CXX_STANDARD_11)
169 static_assert(std::is_same<Type, unsigned char>::value || std::is_same<Type, vpRGBa>::value,
170 "Template function supports only unsigned char and vpRGBa images!");
171#endif
172#if defined(VISP_HAVE_DATASET)
173#if VISP_HAVE_DATASET_VERSION >= 0x030600
174 std::string ext("png");
175#else
176 std::string ext("pgm");
177#endif
178#else
179 // We suppose that the user will download a recent dataset
180 std::string ext("png");
181#endif
182 std::string image_filename = vpIoTools::formatString(input_directory + "/Images/Image_%04d." + ext, cpt);
183 std::string depth_filename = vpIoTools::formatString(input_directory + "/Depth/Depth_%04d.bin", cpt);
184 std::string pose_filename = vpIoTools::formatString(input_directory + "/CameraPose/Camera_%03d.txt", cpt);
185
186 if (!vpIoTools::checkFilename(image_filename) || !vpIoTools::checkFilename(depth_filename) ||
187 !vpIoTools::checkFilename(pose_filename))
188 return false;
189
190 vpImageIo::read(I, image_filename);
191
192 unsigned int depth_width = 0, depth_height = 0;
193 std::ifstream file_depth(depth_filename.c_str(), std::ios::in | std::ios::binary);
194 if (!file_depth.is_open())
195 return false;
196
197 vpIoTools::readBinaryValueLE(file_depth, depth_height);
198 vpIoTools::readBinaryValueLE(file_depth, depth_width);
199 I_depth.resize(depth_height, depth_width);
200 pointcloud.resize(depth_height * depth_width);
201
202 const float depth_scale = 0.000030518f;
203 for (unsigned int i = 0; i < I_depth.getHeight(); i++) {
204 for (unsigned int j = 0; j < I_depth.getWidth(); j++) {
205 vpIoTools::readBinaryValueLE(file_depth, I_depth[i][j]);
206 double x = 0.0, y = 0.0, Z = I_depth[i][j] * depth_scale;
207 vpPixelMeterConversion::convertPoint(cam_depth, j, i, x, y);
208 vpColVector pt3d(4, 1.0);
209 pt3d[0] = x * Z;
210 pt3d[1] = y * Z;
211 pt3d[2] = Z;
212 pointcloud[i * I_depth.getWidth() + j] = pt3d;
213 }
214 }
215
216 std::ifstream file_pose(pose_filename.c_str());
217 if (!file_pose.is_open()) {
218 return false;
219 }
220
221 for (unsigned int i = 0; i < 4; i++) {
222 for (unsigned int j = 0; j < 4; j++) {
223 file_pose >> cMo[i][j];
224 }
225 }
226
227 return true;
228}
229
230template <typename Type>
231bool run(vpImage<Type> &I, const std::string &input_directory, bool opt_click_allowed, bool opt_display,
232 bool useScanline, int opt_lastFrame, bool use_mask)
233{
234#if (VISP_CXX_STANDARD >= VISP_CXX_STANDARD_11)
235 static_assert(std::is_same<Type, unsigned char>::value || std::is_same<Type, vpRGBa>::value,
236 "Template function supports only unsigned char and vpRGBa images!");
237#endif
238// Initialise a display
239#if defined(VISP_HAVE_X11)
240 vpDisplayX display1, display2;
241#elif defined(VISP_HAVE_GDI)
242 vpDisplayGDI display1, display2;
243#elif defined(HAVE_OPENCV_HIGHGUI)
244 vpDisplayOpenCV display1, display2;
245#elif defined(VISP_HAVE_D3D9)
246 vpDisplayD3D display1, display2;
247#elif defined(VISP_HAVE_GTK)
248 vpDisplayGTK display1, display2;
249#else
250 opt_display = false;
251#endif
252
253 std::vector<int> tracker_type;
254 tracker_type.push_back(vpMbGenericTracker::DEPTH_DENSE_TRACKER);
255 vpMbGenericTracker tracker(tracker_type);
256
257#if defined(VISP_HAVE_PUGIXML)
258 tracker.loadConfigFile(input_directory + "/Config/chateau_depth.xml");
259#else
260 // Corresponding parameters manually set to have an example code
261 {
263 cam_depth.initPersProjWithoutDistortion(700.0, 700.0, 320.0, 240.0);
264 tracker.setCameraParameters(cam_depth);
265 }
266 // Depth
267 tracker.setDepthNormalFeatureEstimationMethod(vpMbtFaceDepthNormal::ROBUST_FEATURE_ESTIMATION);
268 tracker.setDepthNormalPclPlaneEstimationMethod(2);
269 tracker.setDepthNormalPclPlaneEstimationRansacMaxIter(200);
270 tracker.setDepthNormalPclPlaneEstimationRansacThreshold(0.001);
271 tracker.setDepthNormalSamplingStep(2, 2);
272
273 tracker.setDepthDenseSamplingStep(4, 4);
274
275#if defined(VISP_HAVE_MODULE_KLT) && defined(VISP_HAVE_OPENCV) && defined(HAVE_OPENCV_IMGPROC) && defined(HAVE_OPENCV_VIDEO)
276 tracker.setKltMaskBorder(5);
277#endif
278
279 tracker.setAngleAppear(vpMath::rad(85.0));
280 tracker.setAngleDisappear(vpMath::rad(89.0));
281 tracker.setNearClippingDistance(0.01);
282 tracker.setFarClippingDistance(2.0);
283 tracker.setClipping(tracker.getClipping() | vpMbtPolygon::FOV_CLIPPING);
284#endif
285 tracker.loadModel(input_directory + "/Models/chateau.cao");
287 T[0][0] = -1;
288 T[0][3] = -0.2;
289 T[1][1] = 0;
290 T[1][2] = 1;
291 T[1][3] = 0.12;
292 T[2][1] = 1;
293 T[2][2] = 0;
294 T[2][3] = -0.15;
295 tracker.loadModel(input_directory + "/Models/cube.cao", false, T);
297 tracker.getCameraParameters(cam_depth);
298 tracker.setDisplayFeatures(true);
299 tracker.setScanLineVisibilityTest(useScanline);
300
301 vpImage<uint16_t> I_depth_raw;
303 vpHomogeneousMatrix cMo_truth;
304 std::vector<vpColVector> pointcloud;
305 int cpt_frame = 1;
306 if (!read_data(input_directory, cpt_frame, cam_depth, I, I_depth_raw, pointcloud, cMo_truth)) {
307 std::cerr << "Cannot read first frame!" << std::endl;
308 return EXIT_FAILURE;
309 }
310
311 vpImage<bool> mask(I.getHeight(), I.getWidth());
312 const double roi_step = 7.0;
313 const double roi_step2 = 6.0;
314 if (use_mask) {
315 mask = false;
316 for (unsigned int i = static_cast<unsigned int>(I.getRows() / roi_step);
317 i < static_cast<unsigned int>(I.getRows() * roi_step2 / roi_step); i++) {
318 for (unsigned int j = static_cast<unsigned int>(I.getCols() / roi_step);
319 j < static_cast<unsigned int>(I.getCols() * roi_step2 / roi_step); j++) {
320 mask[i][j] = true;
321 }
322 }
323 tracker.setMask(mask);
324 }
325
326 vpImageConvert::createDepthHistogram(I_depth_raw, I_depth);
327 if (opt_display) {
328#ifdef VISP_HAVE_DISPLAY
329 display1.init(I, 0, 0, "Image");
330 display2.init(I_depth, static_cast<int>(I.getWidth()), 0, "Depth");
331#endif
332 }
333
335 depth_M_color[0][3] = -0.05;
336 tracker.initFromPose(I, depth_M_color * cMo_truth);
337
338 bool click = false, quit = false, correct_accuracy = true;
339 std::vector<double> vec_err_t, vec_err_tu;
340 std::vector<double> time_vec;
341 while (read_data(input_directory, cpt_frame, cam_depth, I, I_depth_raw, pointcloud, cMo_truth) && !quit &&
342 (opt_lastFrame > 0 ? static_cast<int>(cpt_frame) <= opt_lastFrame : true)) {
343 vpImageConvert::createDepthHistogram(I_depth_raw, I_depth);
344
345 if (opt_display) {
347 vpDisplay::display(I_depth);
348 }
349
350 double t = vpTime::measureTimeMs();
351 std::map<std::string, const vpImage<Type> *> mapOfImages;
352 std::map<std::string, const std::vector<vpColVector> *> mapOfPointclouds;
353 mapOfPointclouds["Camera"] = &pointcloud;
354 std::map<std::string, unsigned int> mapOfWidths, mapOfHeights;
355 mapOfWidths["Camera"] = I_depth.getWidth();
356 mapOfHeights["Camera"] = I_depth.getHeight();
357
358 tracker.track(mapOfImages, mapOfPointclouds, mapOfWidths, mapOfHeights);
359 vpHomogeneousMatrix cMo = tracker.getPose();
361 time_vec.push_back(t);
362
363 if (opt_display) {
364 tracker.display(I_depth, cMo, cam_depth, vpColor::red, 3);
365 vpDisplay::displayFrame(I_depth, cMo, cam_depth, 0.05, vpColor::none, 3);
366
367 std::stringstream ss;
368 ss << "Frame: " << cpt_frame;
369 vpDisplay::displayText(I_depth, 20, 20, ss.str(), vpColor::red);
370 ss.str("");
371 ss << "Nb features: " << tracker.getError().getRows();
372 vpDisplay::displayText(I_depth, 40, 20, ss.str(), vpColor::red);
373 }
374
375 vpPoseVector pose_est(cMo);
376 vpPoseVector pose_truth(depth_M_color * cMo_truth);
377 vpColVector t_est(3), t_truth(3);
378 vpColVector tu_est(3), tu_truth(3);
379 for (unsigned int i = 0; i < 3; i++) {
380 t_est[i] = pose_est[i];
381 t_truth[i] = pose_truth[i];
382 tu_est[i] = pose_est[i + 3];
383 tu_truth[i] = pose_truth[i + 3];
384 }
385
386 vpColVector t_err = t_truth - t_est, tu_err = tu_truth - tu_est;
387 double t_err2 = sqrt(t_err.sumSquare()), tu_err2 = vpMath::deg(sqrt(tu_err.sumSquare()));
388 vec_err_t.push_back(t_err2);
389 vec_err_tu.push_back(tu_err2);
390 const double t_thresh = useScanline ? 0.003 : 0.002;
391 const double tu_thresh = useScanline ? 0.5 : 0.4;
392 if (!use_mask && (t_err2 > t_thresh || tu_err2 > tu_thresh)) { // no accuracy test with mask
393 std::cerr << "Pose estimated exceeds the threshold (t_thresh = " << t_thresh << ", tu_thresh = " << tu_thresh
394 << ")!" << std::endl;
395 std::cout << "t_err: " << t_err2 << " ; tu_err: " << tu_err2 << std::endl;
396 correct_accuracy = false;
397 }
398
399 if (opt_display) {
400 if (use_mask) {
401 vpRect roi(vpImagePoint(I.getRows() / roi_step, I.getCols() / roi_step),
402 vpImagePoint(I.getRows() * roi_step2 / roi_step, I.getCols() * roi_step2 / roi_step));
404 }
405
407 vpDisplay::flush(I_depth);
408 }
409
410 if (opt_display && opt_click_allowed) {
412 if (vpDisplay::getClick(I, button, click)) {
413 switch (button) {
415 quit = !click;
416 break;
417
419 click = !click;
420 break;
421
422 default:
423 break;
424 }
425 }
426 }
427
428 cpt_frame++;
429 }
430
431 if (!time_vec.empty())
432 std::cout << "Computation time, Mean: " << vpMath::getMean(time_vec)
433 << " ms ; Median: " << vpMath::getMedian(time_vec) << " ms ; Std: " << vpMath::getStdev(time_vec) << " ms"
434 << std::endl;
435
436 if (!vec_err_t.empty())
437 std::cout << "Max translation error: " << *std::max_element(vec_err_t.begin(), vec_err_t.end()) << std::endl;
438
439 if (!vec_err_tu.empty())
440 std::cout << "Max thetau error: " << *std::max_element(vec_err_tu.begin(), vec_err_tu.end()) << std::endl;
441
442 return correct_accuracy ? EXIT_SUCCESS : EXIT_FAILURE;
443}
444} // namespace
445
446int main(int argc, const char *argv[])
447{
448 try {
449 std::string env_ipath;
450 std::string opt_ipath = "";
451 bool opt_click_allowed = true;
452 bool opt_display = true;
453 bool useScanline = false;
454#if defined(__mips__) || defined(__mips) || defined(mips) || defined(__MIPS__)
455 // To avoid Debian test timeout
456 int opt_lastFrame = 5;
457#else
458 int opt_lastFrame = -1;
459#endif
460 bool use_mask = false;
461 bool use_color_image = false;
462
463 // Get the visp-images-data package path or VISP_INPUT_IMAGE_PATH
464 // environment variable value
466
467 // Read the command line options
468 if (!getOptions(argc, argv, opt_ipath, opt_click_allowed, opt_display, useScanline, opt_lastFrame, use_mask,
469 use_color_image)) {
470 return EXIT_FAILURE;
471 }
472
473 std::cout << "useScanline: " << useScanline << std::endl;
474 std::cout << "use_mask: " << use_mask << std::endl;
475 std::cout << "use_color_image: " << use_color_image << std::endl;
476
477 // Test if an input path is set
478 if (opt_ipath.empty() && env_ipath.empty()) {
479 usage(argv[0], nullptr);
480 std::cerr << std::endl << "ERROR:" << std::endl;
481 std::cerr << " Use -i <visp image path> option or set VISP_INPUT_IMAGE_PATH " << std::endl
482 << " environment variable to specify the location of the " << std::endl
483 << " image path where test images are located." << std::endl
484 << std::endl;
485
486 return EXIT_FAILURE;
487 }
488
489 std::string input_directory =
490 vpIoTools::createFilePath(!opt_ipath.empty() ? opt_ipath : env_ipath, "mbt-depth/Castle-simu");
491 if (!vpIoTools::checkDirectory(input_directory)) {
492 std::cerr << "ViSP-images does not contain the folder: " << input_directory << "!" << std::endl;
493 return EXIT_SUCCESS;
494 }
495
496 if (use_color_image) {
497 vpImage<vpRGBa> I_color;
498 return run(I_color, input_directory, opt_click_allowed, opt_display, useScanline, opt_lastFrame, use_mask);
499 }
500 else {
502 return run(I_gray, input_directory, opt_click_allowed, opt_display, useScanline, opt_lastFrame, use_mask);
503 }
504 }
505 catch (const vpException &e) {
506 std::cout << "Catch an exception: " << e << std::endl;
507 return EXIT_FAILURE;
508 }
509}
510#elif !(defined(VISP_HAVE_LAPACK) || defined(VISP_HAVE_EIGEN3) || defined(VISP_HAVE_OPENCV))
511int main()
512{
513 std::cout << "Cannot run this example: install Lapack, Eigen3 or OpenCV" << std::endl;
514 return EXIT_SUCCESS;
515}
516#else
517int main()
518{
519 std::cout << "Enable MBT module (VISP_HAVE_MODULE_MBT) to launch this test." << std::endl;
520 return EXIT_SUCCESS;
521}
522#endif
Generic class defining intrinsic camera parameters.
Implementation of column vector and the associated operations.
double sumSquare() const
static const vpColor red
Definition vpColor.h:198
static const vpColor none
Definition vpColor.h:210
static const vpColor yellow
Definition vpColor.h:206
Display for windows using Direct3D 3rd party. Thus to enable this class Direct3D should be installed....
Display for windows using GDI (available on any windows 32 platform).
The vpDisplayGTK allows to display image using the GTK 3rd party library. Thus to enable this class G...
The vpDisplayOpenCV allows to display image using the OpenCV library. Thus to enable this class OpenC...
Use the X11 console to display images on unix-like OS. Thus to enable this class X11 should be instal...
Definition vpDisplayX.h:135
void init(vpImage< unsigned char > &I, int win_x=-1, int win_y=-1, const std::string &win_title="") VP_OVERRIDE
static bool getClick(const vpImage< unsigned char > &I, bool blocking=true)
static void display(const vpImage< unsigned char > &I)
static void displayFrame(const vpImage< unsigned char > &I, const vpHomogeneousMatrix &cMo, const vpCameraParameters &cam, double size, const vpColor &color=vpColor::none, unsigned int thickness=1, const vpImagePoint &offset=vpImagePoint(0, 0), const std::string &frameName="", const vpColor &textColor=vpColor::black, const vpImagePoint &textOffset=vpImagePoint(15, 15))
static void flush(const vpImage< unsigned char > &I)
static void displayRectangle(const vpImage< unsigned char > &I, const vpImagePoint &topLeft, unsigned int width, unsigned int height, const vpColor &color, bool fill=false, unsigned int thickness=1)
static void displayText(const vpImage< unsigned char > &I, const vpImagePoint &ip, const std::string &s, const vpColor &color)
error that can be emitted by ViSP classes.
Definition vpException.h:60
Implementation of an homogeneous matrix and operations on such kind of matrices.
static void createDepthHistogram(const vpImage< uint16_t > &src_depth, vpImage< vpRGBa > &dest_rgba)
static void read(vpImage< unsigned char > &I, const std::string &filename, int backend=IO_DEFAULT_BACKEND)
Class that defines a 2D point in an image. This class is useful for image processing and stores only ...
Definition of the vpImage class member functions.
Definition vpImage.h:131
static std::string getViSPImagesDataPath()
static bool checkFilename(const std::string &filename)
static void readBinaryValueLE(std::ifstream &file, int16_t &short_value)
static bool checkDirectory(const std::string &dirname)
static std::string formatString(const std::string &name, unsigned int val)
static std::string createFilePath(const std::string &parent, const std::string &child)
static double rad(double deg)
Definition vpMath.h:129
static double getMedian(const std::vector< double > &v)
Definition vpMath.cpp:343
static double getStdev(const std::vector< double > &v, bool useBesselCorrection=false)
Definition vpMath.cpp:374
static double getMean(const std::vector< double > &v)
Definition vpMath.cpp:323
static double deg(double rad)
Definition vpMath.h:119
Real-time 6D object pose tracking using its CAD model.
@ ROBUST_FEATURE_ESTIMATION
Robust scheme to estimate the normal of the plane.
static bool parse(int *argcPtr, const char **argv, vpArgvInfo *argTable, int flags)
static void convertPoint(const vpCameraParameters &cam, const double &u, const double &v, double &x, double &y)
Implementation of a pose vector and operations on poses.
Defines a rectangle in the plane.
Definition vpRect.h:79
read_data(CameraParameters|None cam_depth, ImageGray I, rs.pipeline pipe)
VISP_EXPORT double measureTimeMs()