基于Rangenet Lib的自动驾驶LiDAR点云语义分割与可视化

RobotsRuning

已于 2024-06-01 17:55:26 修改

阅读量921

点赞数 14

文章标签：自动驾驶人工智能 KITTI Range_Net

于 2024-01-02 15:23:16 首次发布

本文链接：https://blog.csdn.net/u014374826/article/details/135341566

版权

这段代码是一个C++程序，用于处理来自KITTI数据集的激光雷达（LiDAR）扫描数据。程序主要实现以下功能：

1. **读取和解析命令行参数**：使用Boost库中的`program_options`模块来定义和解析命令行参数。这包括扫描文件路径、模型路径以及是否启用详细模式（verbose）。

2. **处理KITTI数据集中的LiDAR扫描数据**：程序遍历指定KITTI数据集目录中的LiDAR扫描数据（`.bin`格式）。这些数据包含了LiDAR扫描的点云信息。

3. **LiDAR数据的语义分割**：使用`rangenet_lib`库创建一个网络模型来进行语义分割。这个库用于为LiDAR点云数据提供语义标签，例如将点分类为车辆、行人、道路等。

4. **读取和处理每个扫描文件**：对每个扫描文件，程序读取点云数据，并使用创建的网络模型进行推理（infer），得到每个点的语义标签。

5. **转换点云数据**：获取转换后的点云数据和颜色掩膜（color mask），这些颜色表示不同的语义类别。

6. **保存语义分割结果**：将每个点的坐标和对应的颜色标签保存到文本文件中。这些文件用于可视化或进一步分析处理。

7. **可视化（可选）**：如果启用了详细模式（verbose），则使用OpenCV的可视化工具（`cv::viz`）来显示语义分割后的点云。

总的来说，这个程序的主要作用是处理KITTI数据集中的LiDAR点云数据，通过使用语义分割网络对每个点进行分类，然后将分类结果保存并（可选地）进行可视化展示。这对于自动驾驶、机器人导航等领域的研究和应用是非常有用的。

1. infer中的内容

/* Copyright (c) 2019 lifeiya, Chongqing University.
 *
 *  This file is part of advanced rangenet_lib.
 *
 */


// opencv stuff
#include <opencv2/core/core.hpp>
#include <opencv2/highgui/highgui.hpp>
#include <opencv2/imgproc/imgproc.hpp>
#include <opencv2/viz.hpp>

// c++ stuff
#include <chrono>
#include <iomanip>  
#include <iostream>
#include <string>
#include <sstream>

// net stuff
#include <selector.hpp>
namespace cl = rangenet::segmentation;

// boost
#include <boost/program_options.hpp>
namespace po = boost::program_options;
#include <boost/filesystem.hpp>
namespace fs = boost::filesystem;

typedef std::tuple< u_char, u_char, u_char> color;


int main(int argc, const char *argv[]) {
  // define options
  std::string scan;
  std::string path;
  std::string backend = "tensorrt";
 // 如果verbose为true，则程序会输出更多的运行过程信息，如果为false，则只输出最基本的信息。
  bool verbose = false;
  std::ostringstream scanStream;

  std::string kitti_num = "10"; // Replace "01" with the actual value you want
  std::string base_path = "/home/fairlee/dataset/KITTI/sequences_kitti_00_21/" + kitti_num + "/velodyne/";
  std::string file_extension = ".bin";

 // Calculate the number of files in the directory
  int N = std::distance(fs::directory_iterator(base_path), fs::directory_iterator{});

for(int file_num = 1000; file_num < N; ++file_num) {



// cout<<"正在处理-----"<<file_num<<"/"<< N <<"数据"<<endl;

std::cout << std::left << "正在处理 " <<kitti_num<< " 数据集中的第： "<< file_num << " / "  << N << " 帧数据" << std::endl;


  // Parse options
  try {
    po::options_description desc{"Options"};
    desc.add_options()("help,h", "Help screen")(
        "scan,s", po::value<std::string>(&scan),
        "LiDAR scan to infer. No Default")(
        "path,p", po::value<std::string>(),
        "Directory to get the inference model from. No default")(
        "verbose,v", po::bool_switch(),
        "Verbose mode. Calculates profile (time to run)");

    po::variables_map vm;
    po::store(parse_command_line(argc, argv, desc), vm);
    po::notify(vm);

    std::cout << std::setfill('=') << std::setw(80) << "" << std::endl;

    if (vm.count("help")) {
      std::cout << desc << std::endl;
      return 0;
    }


 std::ostringstream scanStream;
    scanStream << base_path << std::setfill('0') << std::setw(6) << file_num << file_extension;
    scan = scanStream.str();

    // make defaults count, parameter check, and print
      path = "/home/fairlee/darknet53/";

    if (vm.count("verbose")) {
      verbose = vm["verbose"].as<bool>();
      std::cout << "verbose: " << verbose << std::endl;
    } else {
      std::cout << "verbose: " << verbose << ". Using default!" << std::endl;
    }

    std::cout << std::setfill('=') << std::setw(80) << "" << std::endl;
  } catch (const po::error &ex) {
    std::cerr << ex.what() << std::endl;
    return 1;
  }

  // create a network
  std::unique_ptr<cl::Net> net = cl::make_net(path, backend);

  // set verbosity
  net->verbosity(verbose);

  // predict each image
  std::cout << std::setfill('=') << std::setw(80) << "" << std::endl;
  std::cout << "Predicting image: " << scan << std::endl;

  // Open a scan
  std::ifstream in(scan.c_str(), std::ios::binary);
  if (!in.is_open()) {
      std::cerr << "Could not open the scan!" << std::endl;
      return 1;
  }

  in.seekg(0, std::ios::end);
  uint32_t num_points = in.tellg() / (4 * sizeof(float));
  in.seekg(0, std::ios::beg);

  std::vector<float> values(4 * num_points);
  in.read((char*)&values[0], 4 * num_points * sizeof(float));

  // predict
  std::vector<std::vector<float>> semantic_scan = net->infer(values, num_points);

  // get point cloud
  std::vector<cv::Vec3f> points = net->getPoints(values, num_points);

  // get color mask
  std::vector<cv::Vec3b> color_mask = net->getLabels(semantic_scan, num_points);


   // Create output filename
    std::ostringstream outfileNameStream;
    outfileNameStream << "/home/fairlee/dataset/KITTI/sequences_kitti_00_21/" << kitti_num << "/RangeNet_point/" << std::setfill('0') << std::setw(6) << file_num << ".txt";
    std::string outfileName = outfileNameStream.str();

    // Create an ofstream object
    std::ofstream outfile(outfileName);

    if (!outfile) {
        std::cerr << "Unable to open output file: " << outfileName << std::endl;
        return 1;
    }

    // Iterate through each point and corresponding color
    for (size_t i = 0; i < points.size(); ++i) {
        // Write the point coordinates and color to the file
        outfile << points[i][0] << " " << points[i][1] << " " << points[i][2];
        outfile << " " << static_cast<int>(color_mask[i][0]) << " " << static_cast<int>(color_mask[i][1]) << " " << static_cast<int>(color_mask[i][2]) << "\n";
    }

    // Close the file
    outfile.close();

 Create an ofstream object
//std::ofstream outfile("output.txt");
 Iterate through each point and corresponding color
//for (size_t i = 0; i < points.size(); ++i) {
//  // Write the point coordinates and color to the file
//  outfile << points[i][0] << " " << points[i][1] << " " << points[i][2];
//  outfile << " " << static_cast<int>(color_mask[i][0]) << " " << static_cast<int>(color_mask[i][1]) << " " << static_cast<int>(color_mask[i][2]) << "\n";
//}
 Close the file
//outfile.close();


  // print the output
  if (verbose) {
    cv::viz::Viz3d window("semantic scan");
    cv::viz::WCloud cloudWidget(points, color_mask);
    while (!window.wasStopped()) {
      window.showWidget("cloud", cloudWidget);
      window.spinOnce(30, true);
    }
  }
  std::cout << std::setfill('=') << std::setw(80) << "" << std::endl;

  std::cout << "Example finished! "<< std::endl;


}

  return 0;
}