Visual Servoing Platform version 3.7.0
Loading...
Searching...
No Matches
tutorial-rbt-realsense.cpp
/*
* ViSP, open source Visual Servoing Platform software.
* Copyright (C) 2005 - 2024 by Inria. All rights reserved.
*
* This software is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 2 of the License, or
* (at your option) any later version.
* See the file LICENSE.txt at the root directory of this source
* distribution for additional information about the GNU GPL.
*
* For using ViSP with software that can not be combined with the GNU
* GPL, please contact Inria about acquiring a ViSP Professional
* Edition License.
*
* See https://visp.inria.fr for more information.
*
* This software was developed at:
* Inria Rennes - Bretagne Atlantique
* Campus Universitaire de Beaulieu
* 35042 Rennes Cedex
* France
*
* If you have questions regarding the use of this file, please contact
* Inria at visp@inria.fr
*
* This file is provided AS IS with NO WARRANTY OF ANY KIND, INCLUDING THE
* WARRANTY OF DESIGN, MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE.
*/
#include <iostream>
#include <visp3/core/vpConfig.h>
#ifdef ENABLE_VISP_NAMESPACE
using namespace VISP_NAMESPACE_NAME;
#endif
#ifndef VISP_HAVE_REALSENSE2
// Fallback entry point, compiled only when VISP_HAVE_REALSENSE2 is not defined:
// reports on the standard error stream that the tutorial cannot run and exits.
int main()
{
  const char *const notice = "To run this tutorial, recompile ViSP with the Realsense third party library";
  std::cerr << notice << std::endl;
  return EXIT_SUCCESS;
}
#else
#include <cmath>
#include <cstdint>
#include <cstdlib>
#include <iomanip>
#include <memory>
#include <sstream>
#include <vector>
#include <visp3/core/vpCameraParameters.h>
#include <visp3/core/vpDisplay.h>
#include <visp3/core/vpHomogeneousMatrix.h>
#include <visp3/core/vpImageConvert.h>
#include <visp3/io/vpJsonArgumentParser.h>
#include <visp3/io/vpParseArgv.h>
#include <visp3/sensor/vpRealSense2.h>
#include <visp3/ar/vpPanda3DFrameworkManager.h>
#include <visp3/rbt/vpRBTracker.h>
#include "render-based-tutorial-utils.h"
#ifndef DOXYGEN_SHOULD_SKIP_THIS
{
CmdArguments() : height(480), width(848), fps(60)
{ }
void registerArguments(vpJsonArgumentParser &parser)
{
parser.addArgument("--height", height, false, "Realsense requested image height")
.addArgument("--width", width, false, "Realsense requested image width")
.addArgument("--fps", fps, false, "Realsense requested framerate");
}
unsigned int height, width, fps;
};
#endif
/*
 * Converts a raw depth map into a scaled floating point depth map and an 8-bit image for display.
 *
 * depthRaw:      raw depth values.
 * depthScale:    factor applied to every raw value to obtain the output depth.
 * maxZDisplay:   depth mapped to the brightest display value; anything farther is drawn as 0.
 * depth:         output, resized to the size of depthRaw, holds depthScale * raw value.
 * IdepthDisplay: output, resized to the size of depthRaw, holds (depth / maxZDisplay) * 255.
 *
 * Both outputs are resized here so that the per-pixel writes below can never run past the end of a
 * buffer allocated with another size.
 * NOTE(review): vpImage::resize is expected to leave an image that already has the requested size
 * untouched - confirm.
 */
void updateDepth(const vpImage<uint16_t> &depthRaw, float depthScale, float maxZDisplay, vpImage<float> &depth, vpImage<unsigned char> &IdepthDisplay)
{
  const unsigned int height = depthRaw.getHeight();
  const unsigned int width = depthRaw.getWidth();
  depth.resize(height, width);
  IdepthDisplay.resize(height, width);

  // A non-positive display range cannot be normalized (division by zero / NaN): draw everything as 0.
  const bool validRange = maxZDisplay > 0.f;
  // Signed loop counter kept on purpose: some OpenMP implementations only accept signed indices.
  const int nbPixels = static_cast<int>(depthRaw.getSize());
#ifdef VISP_HAVE_OPENMP
#pragma omp parallel for
#endif
  for (int i = 0; i < nbPixels; ++i) {
    const float z = depthScale * static_cast<float>(depthRaw.bitmap[i]);
    depth.bitmap[i] = z;
    IdepthDisplay.bitmap[i] = (!validRange || z > maxZDisplay) ? 0 : static_cast<unsigned char>((z / maxZDisplay) * 255.f);
  }
}
int main(int argc, const char **argv)
{
// Read the command line options
vpRBTrackerTutorial::BaseArguments baseArgs;
CmdArguments realsenseArgs;
vpRBTrackerTutorial::vpRBExperimentLogger logger;
vpRBTrackerTutorial::vpRBExperimentPlotter plotter;
"Tutorial showing the usage of the Render-Based tracker with a RealSense camera",
"--config", "/"
);
baseArgs.registerArguments(parser);
realsenseArgs.registerArguments(parser);
logger.registerArguments(parser);
plotter.registerArguments(parser);
parser.parse(argc, argv);
baseArgs.postProcessArguments();
plotter.postProcessArguments(baseArgs.display);
if (baseArgs.enableRenderProfiling) {
vpRBTrackerTutorial::enableRendererProfiling();
}
std::cout << "Loading tracker: " << baseArgs.trackerConfiguration << std::endl;
tracker.loadConfigurationFile(baseArgs.trackerConfiguration);
if (!baseArgs.modelPath.empty()) {
tracker.setModelPath(baseArgs.modelPath);
}
const unsigned int width = realsenseArgs.width, height = realsenseArgs.height;
const unsigned fps = realsenseArgs.fps;
vpRealSense2 realsense;
std::cout << "Opening realsense with settings: " << width << "x" << height << " @ " << fps << "fps" << std::endl;
rs2::config config;
config.enable_stream(RS2_STREAM_COLOR, width, height, RS2_FORMAT_RGBA8, fps);
config.enable_stream(RS2_STREAM_DEPTH, width, height, RS2_FORMAT_Z16, fps);
rs2::align align_to(RS2_STREAM_COLOR);
try {
realsense.open(config);
}
catch (const vpException &e) {
std::cout << "Caught an exception: " << e.what() << std::endl;
std::cout << "Check if the Realsense camera is connected..." << std::endl;
return EXIT_FAILURE;
}
const float depthScale = realsense.getDepthScale(); // used to convert uint16_t to meters
tracker.setCameraParameters(cam, height, width);
tracker.startTracking();
vpImage<vpRGBa> Icol(height, width); // Color image
vpImage<unsigned char> Id(height, width); // Grayscale image, converted from Icol
vpImage<uint16_t> depthRaw(height, width); // Raw depth map, in realsense format
vpImage<float> depth(height, width); // Depth map, in meters
// Display versions of raw image data
vpImage<unsigned char> IdepthDisplay(height, width);
vpImage<unsigned char> IProbaDisplay(height, width);
vpImage<unsigned char> cannyDisplay(height, width);
vpImage<vpRGBa> InormDisplay(height, width);
//camera warmup, colors may appear washed out in the first few frames
for (int i = 0; i < 10; ++i) {
realsense.acquire(Icol);
}
std::cout << "Creating displays..." << std::endl;
std::vector<std::shared_ptr<vpDisplay>> displays, displaysDebug;
if (baseArgs.display) {
displays = vpRBTrackerTutorial::createDisplays(Id, Icol, IdepthDisplay, IProbaDisplay);
if (baseArgs.debugDisplay) {
displaysDebug = vpDisplayFactory::makeDisplayGrid(1, 2,
0, 0,
20, 20,
"Normals in object frame", InormDisplay,
"Depth canny", cannyDisplay
);
}
plotter.init(displays);
}
if (baseArgs.display && !baseArgs.hasInlineInit()) {
bool ready = false;
while (!ready) {
realsense.acquire((unsigned char *)Icol.bitmap, (unsigned char *)depthRaw.bitmap, nullptr, nullptr, &align_to);
updateDepth(depthRaw, depthScale, baseArgs.maxDepthDisplay, depth, IdepthDisplay);
if (vpDisplay::getClick(Id, false)) {
ready = true;
}
else {
vpTime::wait(1000.0 / fps);
}
}
}
// Manual initialization of the tracker
std::cout << "Starting init" << std::endl;
if (baseArgs.hasInlineInit()) {
tracker.setPose(baseArgs.cMoInit);
}
else if (baseArgs.display) {
tracker.initClick(Id, baseArgs.initFile, true);
tracker.getPose(cMo);
}
else {
throw vpException(vpException::notImplementedError, "Cannot initialize tracking: no initial pose provided or display to perform click initialization.");
}
std::cout << "Starting pose: " << vpPoseVector(cMo).t() << std::endl;
if (baseArgs.display) {
}
logger.startLog();
unsigned int iter = 1;
// Main tracking loop
double expStart = vpTime::measureTimeMs();
while (true) {
double frameStart = vpTime::measureTimeMs();
// Acquire images
realsense.acquire((unsigned char *)Icol.bitmap, (unsigned char *)depthRaw.bitmap, nullptr, nullptr, &align_to);
updateDepth(depthRaw, depthScale, baseArgs.maxDepthDisplay, depth, IdepthDisplay);
double trackingStart = vpTime::measureTimeMs();
vpRBTrackingResult result = tracker.track(Id, Icol, depth);
double trackingEnd = vpTime::measureTimeMs();
tracker.getPose(cMo);
switch (result.getStoppingReason()) {
case vpRBTrackingStoppingReason::EXCEPTION:
{
std::cout << "Encountered an exception during tracking, pose was not updated!" << std::endl;
break;
}
case vpRBTrackingStoppingReason::NOT_ENOUGH_FEATURES:
{
std::cout << "There were not enough feature to perform tracking!" << std::endl;
break;
}
case vpRBTrackingStoppingReason::OBJECT_NOT_IN_IMAGE:
{
std::cout << "Object is not in image!" << std::endl;
break;
}
case vpRBTrackingStoppingReason::CONVERGENCE_CRITERION:
{
std::cout << "Convergence criterion reached:" << std::endl;
std::cout << "- Num iterations: " << result.getNumIterations() << std::endl;
std::cout << "- Convergence criterion: " << *(result.getConvergenceMetricValues().end() - 1) << std::endl;
break;
}
case vpRBTrackingStoppingReason::MAX_ITERS:
{
break;
}
default:
{ }
}
const std::shared_ptr<vpRBDriftDetector> driftDetector = tracker.getDriftDetector();
if (driftDetector) {
if (driftDetector->getScore() < 0.25) {
std::cout << "Drift detection has low confidence score: " << driftDetector->getScore() << std::endl;
}
}
double displayStart = vpTime::measureTimeMs();
if (baseArgs.display) {
if (baseArgs.debugDisplay) {
const vpRBFeatureTrackerInput &lastFrame = tracker.getMostRecentFrame();
vpRBTrackerTutorial::displayCanny(lastFrame.renders.silhouetteCanny, cannyDisplay, lastFrame.renders.isSilhouette);
}
tracker.display(Id, Icol, IdepthDisplay);
vpDisplay::displayFrame(Icol, cMo, cam, 0.05, vpColor::none, 2);
vpDisplay::displayText(Id, 20, 5, "Right click to exit", vpColor::red);
if (driftDetector) {
std::stringstream ss;
ss << "Confidence score: " << std::setprecision(2) << driftDetector->getScore() << std::endl;
vpDisplay::displayText(Id, Id.getHeight() - 40, 5, ss.str(), vpColor::red);
}
if (vpDisplay::getClick(Id, button, false)) {
if (button == vpMouseButton::button3) {
break;
}
}
tracker.displayMask(IProbaDisplay);
vpDisplay::display(IProbaDisplay);
vpDisplay::flush(IdepthDisplay); vpDisplay::flush(IProbaDisplay);
}
const double displayEnd = vpTime::measureTimeMs();
const double frameEnd = vpTime::measureTimeMs();
logger.logFrame(tracker, iter, Id, Icol, IdepthDisplay, IProbaDisplay);
std::cout << "Iter " << iter << ": " << round(frameEnd - frameStart) << "ms" << std::endl;
std::cout << "- Tracking: " << round(trackingEnd - trackingStart) << "ms" << std::endl;
std::cout << "- Display: " << round(displayEnd - displayStart) << "ms" << std::endl;
if (baseArgs.verbose) {
std::cout << result.timer() << std::endl;
}
plotter.plot(tracker, (frameEnd - expStart) / 1000.0);
iter++;
}
logger.close();
return EXIT_SUCCESS;
}
#endif
Generic class defining intrinsic camera parameters.
@ perspectiveProjWithoutDistortion
Perspective projection without distortion model.
static const vpColor red
Definition vpColor.h:198
static const vpColor none
Definition vpColor.h:210
static bool getClick(const vpImage< unsigned char > &I, bool blocking=true)
static void display(const vpImage< unsigned char > &I)
static void displayFrame(const vpImage< unsigned char > &I, const vpHomogeneousMatrix &cMo, const vpCameraParameters &cam, double size, const vpColor &color=vpColor::none, unsigned int thickness=1, const vpImagePoint &offset=vpImagePoint(0, 0), const std::string &frameName="", const vpColor &textColor=vpColor::black, const vpImagePoint &textOffset=vpImagePoint(15, 15))
static void flush(const vpImage< unsigned char > &I)
static void displayText(const vpImage< unsigned char > &I, const vpImagePoint &ip, const std::string &s, const vpColor &color)
Error that can be emitted by ViSP classes.
Definition vpException.h:60
@ notImplementedError
Not implemented.
Definition vpException.h:69
Implementation of an homogeneous matrix and operations on such kind of matrices.
static void convert(const vpImage< unsigned char > &src, vpImage< vpRGBa > &dest)
Definition of the vpImage class member functions.
Definition vpImage.h:131
unsigned int getWidth() const
Definition vpImage.h:242
unsigned int getSize() const
Definition vpImage.h:221
Type * bitmap
points toward the bitmap
Definition vpImage.h:135
unsigned int getHeight() const
Definition vpImage.h:181
Command line argument parsing with support for JSON files. If a JSON file is supplied,...
static vpPanda3DFrameworkManager & getInstance()
Implementation of a pose vector and operations on poses.
vpRowVector t() const
All the data related to a single tracking frame. This contains both the input data (from a real camer...
vpRBRenderData renders
camera parameters
Class implementing the Render-Based Tracker (RBT).
Definition vpRBTracker.h:87
vpRBTrackingStoppingReason getStoppingReason() const
vpRBTrackingTimings & timer()
const std::vector< double > & getConvergenceMetricValues() const
unsigned int getNumIterations() const
vpCameraParameters getCameraParameters(const rs2_stream &stream, vpCameraParameters::vpCameraParametersProjType type=vpCameraParameters::perspectiveProjWithDistortion, int index=-1) const
void acquire(vpImage< unsigned char > &grey, double *ts=nullptr)
bool open(const rs2::config &cfg=rs2::config())
float getDepthScale()
std::vector< std::shared_ptr< vpDisplay > > makeDisplayGrid(unsigned int rows, unsigned int cols, unsigned int startX, unsigned int startY, unsigned int paddingX, unsigned int paddingY, Args &... args)
Create a grid of displays, given a set of images. All the displays will be initialized in the correct...
VISP_EXPORT double measureTimeMs()
VISP_EXPORT int wait(double t0, double t)
void registerArguments(vpJsonArgumentParser &parser)
vpImage< unsigned char > isSilhouette
Image containing the orientation of the gradients.
vpImage< float > silhouetteCanny