Example of eye-to-hand image-based control law. We control here a real robot, the Franka Emika Panda robot (arm with 7 degrees of freedom). An Apriltag is attached to the robot end-effector. A camera mounted on a fixed tripod is observing the Apriltag. The velocity is computed in the camera frame. The inverse jacobian that converts cartesian velocities in joint velocities is implemented in the robot low level controller. Visual features are the image coordinates of 4 points corresponding to the corners of an AprilTag.
The device used to acquire images is a Realsense D435 device.
Camera extrinsic (eMo) transformation is set by default to a value that will not match Your configuration.
In this example we show that it is possible to achieve the visual-servoing without pose estimation:
#include <iostream>
#include <fstream>
#include <visp3/core/vpConfig.h>
#include <visp3/core/vpCameraParameters.h>
#include <visp3/core/vpIoTools.h>
#include <visp3/core/vpXmlParserCamera.h>
#include <visp3/detection/vpDetectorAprilTag.h>
#include <visp3/gui/vpDisplayFactory.h>
#include <visp3/gui/vpPlot.h>
#include <visp3/io/vpImageIo.h>
#include <visp3/robot/vpRobotFranka.h>
#include <visp3/sensor/vpRealSense2.h>
#include <visp3/visual_features/vpFeatureBuilder.h>
#include <visp3/visual_features/vpFeaturePoint.h>
#include <visp3/vs/vpServo.h>
#include <visp3/vs/vpServoDisplay.h>
#if defined(VISP_HAVE_REALSENSE2) && defined(VISP_HAVE_DISPLAY) && defined(VISP_HAVE_FRANKA) && defined(VISP_HAVE_PUGIXML)
#ifdef ENABLE_VISP_NAMESPACE
#endif
bool save_desired_features(const std::string &filename, const std::vector<vpFeaturePoint> &desired_features)
{
std::ofstream file(filename);
if (file.is_open()) {
for (size_t i = 0; i < desired_features.size(); ++i) {
file << desired_features[i].get_x() << " " << desired_features[i].get_y() << " " << desired_features[i].get_Z() << std::endl;
}
file.close();
return true;
}
else {
return false;
}
}
bool read_desired_features(const std::string &filename, std::vector<vpFeaturePoint> &desired_features)
{
desired_features.clear();
std::ifstream file(filename);
if (file.is_open()) {
std::string line;
while (std::getline(file, line)) {
std::istringstream iss(line);
double x, y, Z;
if (!(iss >> x >> y >> Z)) {
return false;
}
desired_features.push_back(s_d);
}
file.close();
return true;
}
else {
return false;
}
}
std::vector<vpImagePoint> *traj_vip)
{
for (
size_t i = 0;
i < vip.size(); ++
i) {
if (traj_vip[i].size()) {
traj_vip[
i].push_back(vip[i]);
}
}
else {
traj_vip[
i].push_back(vip[i]);
}
}
for (
size_t i = 0;
i < vip.size(); ++
i) {
for (
size_t j = 1;
j < traj_vip[
i].size();
j++) {
}
}
}
int main(int argc, char **argv)
{
double opt_tag_size = 0.120;
bool opt_tag_z_aligned = false;
std::string opt_robot_ip = "192.168.1.1";
std::string opt_rMc_filename = "";
std::string opt_intrinsic_filename = "";
std::string opt_camera_name = "Camera";
bool display_tag = true;
int opt_quad_decimate = 2;
bool opt_verbose = false;
bool opt_plot = false;
bool opt_adaptive_gain = false;
bool opt_task_sequencing = false;
bool opt_learn_desired_features = false;
std::string desired_features_filename = "learned_desired_features.txt";
double convergence_threshold = 0.00005;
for (
int i = 1;
i < argc; ++
i) {
if ((std::string(argv[i]) == "--tag-size") && (i + 1 < argc)) {
opt_tag_size = std::stod(argv[++i]);
}
else if (std::string(argv[i]) == "--tag-z-aligned") {
opt_tag_z_aligned = true;
}
else if ((std::string(argv[i]) == "--ip") && (i + 1 < argc)) {
opt_robot_ip = std::string(argv[++i]);
}
else if (std::string(argv[i]) == "--intrinsic" && i + 1 < argc) {
opt_intrinsic_filename = std::string(argv[++i]);
}
else if (std::string(argv[i]) == "--camera-name" && i + 1 < argc) {
opt_camera_name = std::string(argv[++i]);
}
else if ((std::string(argv[i]) == "--rMc") && (i + 1 < argc)) {
opt_rMc_filename = std::string(argv[++i]);
}
else if ((std::string(argv[i]) == "--verbose") || (std::string(argv[i]) == "-v")) {
opt_verbose = true;
}
else if (std::string(argv[i]) == "--plot") {
opt_plot = true;
}
else if (std::string(argv[i]) == "--adaptive-gain") {
opt_adaptive_gain = true;
}
else if (std::string(argv[i]) == "--task-sequencing") {
opt_task_sequencing = true;
}
else if ((std::string(argv[i]) == "--tag-quad-decimate") && (i + 1 < argc)) {
opt_quad_decimate = std::stoi(argv[++i]);
}
else if (std::string(argv[i]) == "--no-convergence-threshold") {
convergence_threshold = 0.;
}
else if (std::string(argv[i]) == "--learn-desired-features") {
opt_learn_desired_features = true;
}
else if ((std::string(argv[i]) == "--help") || (std::string(argv[i]) == "-h")) {
std::cout << "SYNOPSYS" << std::endl
<< " " << argv[0]
<< " [--ip <controller ip>]"
<< " [--intrinsic <xml file>]"
<< " [--camera-name <name>]"
<< " [--tag-size <size>]"
<< " [--tag-quad-decimate <decimation factor>]"
<< " [--tag-z-aligned]"
<< " [--learn-desired-features]"
<< " [--rMc <file.yaml>]"
<< " [--adaptive-gain]"
<< " [--plot]"
<< " [--task-sequencing]"
<< " [--no-convergence-threshold]"
<< " [--verbose, -v]"
<< " [--help, -h]\n"
<< std::endl;
std::cout << "DESCRIPTION" << std::endl
<< " Use an image-based visual-servoing scheme to position the camera in front of an Apriltag." << std::endl
<< std::endl
<< " --ip <controller ip>" << std::endl
<< " Franka controller ip address" << std::endl
<< " Default: " << opt_robot_ip << std::endl
<< std::endl
<< " --intrinsic <xml file>" << std::endl
<< " XML file that contains camera intrinsic parameters. " << std::endl
<< " If no file is specified, use Realsense camera factory intrinsic parameters." << std::endl
<< std::endl
<< " --camera-name <name>" << std::endl
<< " Camera name in the XML file that contains camera intrinsic parameters." << std::endl
<< " Default: \"Camera\"" << std::endl
<< std::endl
<< " --tag-size <size>" << std::endl
<< " Apriltag size in [m]." << std::endl
<< " Default: " << opt_tag_size << " [m]" << std::endl
<< std::endl
<< " --tag-quad-decimate <decimation factor>" << std::endl
<< " Decimation factor used during Apriltag detection." << std::endl
<< " Default: " << opt_quad_decimate << std::endl
<< std::endl
<< " --tag-z-aligned" << std::endl
<< " When enabled, tag z-axis and camera z-axis are aligned." << std::endl
<< " Default: false" << std::endl
<< std::endl
<< " --rMc <file.yaml>" << std::endl
<< " Yaml file containing the extrinsic transformation between" << std::endl
<< " robot reference frame and camera frames." << std::endl
<< std::endl
<< " --adaptive-gain" << std::endl
<< " Flag to enable adaptive gain to speed up visual servo near convergence." << std::endl
<< std::endl
<< " --plot" << std::endl
<< " Flag to enable curve plotter." << std::endl
<< std::endl
<< " --task-sequencing" << std::endl
<< " Flag to enable task sequencing scheme." << std::endl
<< std::endl
<< " --no-convergence-threshold" << std::endl
<< " Flag to disable convergence threshold used to stop the visual servo." << std::endl
<< std::endl
<< " --learn-desired-pose" << std::endl
<< " Flag to enable desired pose learning." << std::endl
<< " Data are saved in learned-desired-pose.yaml file." << std::endl
<< std::endl
<< " --verbose, -v" << std::endl
<< " Flag to enable extra verbosity." << std::endl
<< std::endl
<< " --help, -h" << std::endl
<< " Print this helper message." << std::endl
<< std::endl;
return EXIT_SUCCESS;
}
else {
std::cout << "\nERROR" << std::endl
<< std::string(argv[i]) << " command line option is not supported." << std::endl
<< "Use " << std::string(argv[0]) << " --help" << std::endl
<< std::endl;
return EXIT_FAILURE;
}
}
config.enable_stream(RS2_STREAM_COLOR, 640, 480, RS2_FORMAT_RGBA8, 30);
config.enable_stream(RS2_STREAM_DEPTH, 640, 480, RS2_FORMAT_Z16, 30);
config.enable_stream(RS2_STREAM_INFRARED, 640, 480, RS2_FORMAT_Y8, 30);
#if (VISP_CXX_STANDARD >= VISP_CXX_STANDARD_11)
#else
#endif
std::cout << "Parameters:" << std::endl;
std::cout << " Apriltag " << std::endl;
std::cout << " Size [m] : " << opt_tag_size << std::endl;
std::cout << " Z aligned : " << (opt_tag_z_aligned ? "true" : "false") << std::endl;
std::cout << " Camera intrinsics " << std::endl;
std::cout << " Factory parameters : " << (opt_intrinsic_filename.empty() ? "yes" : "no") << std::endl;
if (opt_intrinsic_filename.empty()) {
std::cout << "Use Realsense camera intrinsic factory parameters: " << std::endl;
std::cout <<
"cam:\n" <<
cam << std::endl;
}
std::cout << "Camera parameters file " << opt_intrinsic_filename << " doesn't exist." << std::endl;
return EXIT_FAILURE;
}
else {
if (!opt_camera_name.empty()) {
std::cout << " Param file name [.xml]: " << opt_intrinsic_filename << std::endl;
std::cout << " Camera name : " << opt_camera_name << std::endl;
std::cout << "Unable to parse parameters with distortion for camera \"" << opt_camera_name << "\" from "
<< opt_intrinsic_filename << " file" << std::endl;
std::cout << "Attempt to find parameters without distortion" << std::endl;
if (
parser.parse(cam, opt_intrinsic_filename, opt_camera_name,
std::cout << "Unable to parse parameters without distortion for camera \"" << opt_camera_name << "\" from "
<< opt_intrinsic_filename << " file" << std::endl;
return EXIT_FAILURE;
}
}
}
}
std::cout <<
"Camera parameters used to compute the pose:\n" <<
cam << std::endl;
detector.setAprilTagPoseEstimationMethod(poseEstimationMethod);
detector.setDisplayTag(display_tag);
detector.setAprilTagQuadDecimate(opt_quad_decimate);
detector.setZAlignedWithCameraAxis(opt_tag_z_aligned);
if (opt_learn_desired_features) {
bool quit = false;
while (!quit) {
std::vector<vpHomogeneousMatrix> c_M_o_vec;
bool ret = detector.detect(I, opt_tag_size, cam, c_M_o_vec);
std::vector< std::vector<vpImagePoint> > tags_corners;
if (ret) {
if (detector.getNbObjects() == 1) {
tags_corners = detector.getTagsCorners();
for (
size_t i = 0;
i < 4; ++
i) {
std::stringstream ss;
}
}
}
switch (button) {
if (ret) {
if (detector.getNbObjects() == 1) {
std::vector<vpFeaturePoint> p_d(4);
for (
size_t i = 0;
i < 4; ++
i) {
std::stringstream ss;
}
std::vector<vpPoint> point(4);
point[0].setWorldCoordinates(-opt_tag_size / 2., -opt_tag_size / 2., 0);
point[1].setWorldCoordinates(+opt_tag_size / 2., -opt_tag_size / 2., 0);
point[2].setWorldCoordinates(+opt_tag_size / 2., +opt_tag_size / 2., 0);
point[3].setWorldCoordinates(-opt_tag_size / 2., +opt_tag_size / 2., 0);
for (
size_t i = 0;
i < point.size(); ++
i) {
point[
i].changeFrame(cd_M_o, c_P);
}
if (save_desired_features(desired_features_filename, p_d)) {
std::cout << "Desired visual features saved in: " << desired_features_filename << std::endl;
}
else {
std::cout << "Error: Unable to save desired features in " << desired_features_filename << std::endl;
return EXIT_FAILURE;
}
}
else {
std::cout << "Cannot save desired features. More than 1 tag is visible in the image..." << std::endl;
}
}
else {
std::cout << "Cannot save desired features. Tag is not visible in the image..." << std::endl;
}
break;
quit = true;
break;
default:
break;
}
}
}
return EXIT_SUCCESS;
}
std::vector<vpFeaturePoint> p_d;
std::cout << "Cannot start eye-to-hand visual-servoing. Desired features are not available." << std::endl;
std::cout << "use --learn-desired-features flag to learn the desired features." << std::endl;
return EXIT_FAILURE;
}
else {
if (!read_desired_features(desired_features_filename, p_d)) {
std::cout << "Error: Unable to read desired features from: " << desired_features_filename << std::endl;
return EXIT_FAILURE;
}
}
if (!opt_rMc_filename.empty()) {
r_P_c.
loadYAML(opt_rMc_filename, r_P_c);
}
else {
std::cout << "Warning, rMc transformation is not specified using --rMc parameter." << std::endl;
return EXIT_FAILURE;
}
std::cout << "r_M_c:\n" << r_M_c << std::endl;
try {
robot.connect(opt_robot_ip);
std::vector<vpFeaturePoint>
p(4);
for (
size_t i = 0;
i <
p.size(); ++
i) {
task.addFeature(p[i], p_d[i]);
}
if (opt_adaptive_gain) {
}
else {
}
task.set_cVf(r_M_c.inverse());
int iter_plot = 0;
if (opt_plot) {
plotter =
new vpPlot(2,
static_cast<int>(250 * 2), 500,
static_cast<int>(I.getWidth()) + 80, 10,
"Real time curves plotter");
plotter->setTitle(0,
"Visual features error");
plotter->setTitle(1,
"Joint velocities");
plotter->setLegend(0, 0,
"error_feat_p1_x");
plotter->setLegend(0, 1,
"error_feat_p1_y");
plotter->setLegend(0, 2,
"error_feat_p2_x");
plotter->setLegend(0, 3,
"error_feat_p2_y");
plotter->setLegend(0, 4,
"error_feat_p3_x");
plotter->setLegend(0, 5,
"error_feat_p3_y");
plotter->setLegend(0, 6,
"error_feat_p4_x");
plotter->setLegend(0, 7,
"error_feat_p4_y");
}
bool final_quit = false;
bool has_converged = false;
bool send_velocities = false;
bool servo_started = false;
std::vector<vpImagePoint> *traj_corners = nullptr;
while (!has_converged && !final_quit) {
bool ret = detector.detect(I);
{
std::stringstream ss;
ss << "Left click to " << (send_velocities ? "stop the robot" : "servo the robot") << ", right click to quit.";
}
if (ret && detector.getNbObjects() == 1) {
static bool first_time = true;
std::vector<vpImagePoint> corners = detector.getPolygon(0);
for (
size_t i = 0;
i < corners.size(); ++
i) {
}
robot.get_eJe(e_J_e);
if (opt_task_sequencing) {
if (!servo_started) {
if (send_velocities) {
servo_started = true;
}
}
}
else {
qdot =
task.computeControlLaw();
}
for (
size_t i = 0;
i < corners.size(); ++
i) {
std::stringstream ss;
}
if (first_time) {
traj_corners = new std::vector<vpImagePoint>[corners.size()];
}
display_point_trajectory(I, corners, traj_corners);
if (opt_plot) {
iter_plot++;
}
if (opt_verbose) {
std::cout << "qdot: " << qdot.t() << std::endl;
}
std::stringstream ss;
ss <<
"error: " <<
error;
if (opt_verbose)
std::cout <<
"error: " <<
error << std::endl;
if (error < convergence_threshold) {
has_converged = true;
std::cout << "Servo task has converged" << std::endl;
}
if (first_time) {
first_time = false;
}
}
else {
qdot = 0;
}
if (!send_velocities) {
qdot = 0;
}
{
std::stringstream ss;
}
switch (button) {
send_velocities = !send_velocities;
break;
final_quit = true;
qdot = 0;
break;
default:
break;
}
}
}
std::cout << "Stop the robot " << std::endl;
if (opt_plot && plotter != nullptr) {
}
if (!final_quit) {
while (!final_quit) {
final_quit = true;
}
}
}
if (traj_corners) {
delete[] traj_corners;
}
}
std::cout <<
"ViSP exception: " <<
e.what() << std::endl;
std::cout << "Stop the robot " << std::endl;
#if (VISP_CXX_STANDARD < VISP_CXX_STANDARD_11)
if (display != nullptr) {
delete display;
}
#endif
return EXIT_FAILURE;
}
catch (const franka::NetworkException &e) {
std::cout <<
"Franka network exception: " <<
e.what() << std::endl;
std::cout << "Check if you are connected to the Franka robot"
<< " or if you specified the right IP using --ip command line option set by default to 192.168.1.1. "
<< std::endl;
#if (VISP_CXX_STANDARD < VISP_CXX_STANDARD_11)
if (display != nullptr) {
delete display;
}
#endif
return EXIT_FAILURE;
}
catch (const std::exception &e) {
std::cout <<
"Franka exception: " <<
e.what() << std::endl;
#if (VISP_CXX_STANDARD < VISP_CXX_STANDARD_11)
if (display != nullptr) {
delete display;
}
#endif
return EXIT_FAILURE;
}
#if (VISP_CXX_STANDARD < VISP_CXX_STANDARD_11)
if (display != nullptr) {
delete display;
}
#endif
return EXIT_SUCCESS;
}
#else
int main()
{
#if !defined(VISP_HAVE_REALSENSE2)
std::cout << "Install librealsense-2.x and rebuild ViSP." << std::endl;
#endif
#if !defined(VISP_HAVE_FRANKA)
std::cout << "Install libfranka and rebuild ViSP." << std::endl;
#endif
#if !defined(VISP_HAVE_PUGIXML)
std::cout << "Build ViSP with pugixml support enabled." << std::endl;
#endif
return EXIT_SUCCESS;
}
#endif
Adaptive gain computation.
static bool loadYAML(const std::string &filename, vpArray2D< Type > &A, char *header=nullptr)
Generic class defining intrinsic camera parameters.
@ perspectiveProjWithDistortion
Perspective projection with distortion model.
@ perspectiveProjWithoutDistortion
Perspective projection without distortion model.
Implementation of column vector and the associated operations.
static const vpColor green
@ TAG_36h11
AprilTag 36h11 pattern (recommended).
Class that defines generic functionalities for display.
static bool getClick(const vpImage< unsigned char > &I, bool blocking=true)
static void display(const vpImage< unsigned char > &I)
static void displayLine(const vpImage< unsigned char > &I, const vpImagePoint &ip1, const vpImagePoint &ip2, const vpColor &color, unsigned int thickness=1, bool segment=true)
static void displayCross(const vpImage< unsigned char > &I, const vpImagePoint &ip, unsigned int size, const vpColor &color, unsigned int thickness=1)
static void flush(const vpImage< unsigned char > &I)
static void displayText(const vpImage< unsigned char > &I, const vpImagePoint &ip, const std::string &s, const vpColor &color)
error that can be emitted by ViSP classes.
static void create(vpFeaturePoint &s, const vpCameraParameters &cam, const vpDot &d)
Class that defines a 2D point visual feature which is composed by two parameters that are the cartes...
vpFeaturePoint & buildFrom(const double &x, const double &y, const double &Z)
Implementation of an homogeneous matrix and operations on such kind of matrices.
Class that defines a 2D point in an image. This class is useful for image processing and stores only ...
static double distance(const vpImagePoint &iP1, const vpImagePoint &iP2)
Definition of the vpImage class member functions.
Implementation of a matrix and operations on matrices.
static void convertPoint(const vpCameraParameters &cam, const double &x, const double &y, double &u, double &v)
static void convertPoint(const vpCameraParameters &cam, const double &u, const double &v, double &x, double &y)
This class enables real time drawing of 2D or 3D graphics. An instance of the class open a window whi...
Implementation of a pose vector and operations on poses.
vpCameraParameters getCameraParameters(const rs2_stream &stream, vpCameraParameters::vpCameraParametersProjType type=vpCameraParameters::perspectiveProjWithDistortion, int index=-1) const
void acquire(vpImage< unsigned char > &grey, double *ts=nullptr)
bool open(const rs2::config &cfg=rs2::config())
@ STATE_VELOCITY_CONTROL
Initialize the velocity controller.
@ STATE_STOP
Stops robot motion especially in velocity and acceleration control.
static void display(const vpServo &s, const vpCameraParameters &cam, const vpImage< unsigned char > &I, vpColor currentColor=vpColor::green, vpColor desiredColor=vpColor::red, unsigned int thickness=1)
@ EYETOHAND_L_cVf_fVe_eJe
XML parser to load and save intrinsic camera parameters.
std::shared_ptr< vpDisplay > createDisplay()
Return a smart pointer vpDisplay specialization if a GUI library is available or nullptr otherwise.
vpDisplay * allocateDisplay()
Return a newly allocated vpDisplay specialization if a GUI library is available or nullptr otherwise.
VISP_EXPORT double measureTimeMs()