Skip to content

Commit

Permalink
dav2: Try to run on jetson, hitting mem limit
Browse files Browse the repository at this point in the history
  • Loading branch information
marcojob committed Nov 11, 2024
1 parent 7abc401 commit b7f290a
Show file tree
Hide file tree
Showing 9 changed files with 74 additions and 21 deletions.
3 changes: 2 additions & 1 deletion .devcontainer/devcontainer.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,8 @@
"customizations": {
"vscode": {
"extensions": [
"ms-vscode.cpptools"
"ms-vscode.cpptools",
"ms-iot.vscode-ros"
],
"settings": {
"files.hotExit": "off",
Expand Down
7 changes: 4 additions & 3 deletions CMakeLists.txt
Original file line number Diff line number Diff line change
Expand Up @@ -97,13 +97,14 @@ catkin_package(
add_executable(${PROJECT_NAME}_node src/usb_cam_node.cpp)
target_link_libraries(${PROJECT_NAME}_node
${PROJECT_NAME}
${catkin_LIBRARIES}
${avcodec_LIBRARIES}
${avutil_LIBRARIES}
${swscale_LIBRARIES}
${NVINFER}
${catkin_LIBRARIES}
${CUDA_LIBRARIES}
${NVINFER_PLUGIN}
${NVINFER}
${NVONNXPARSER}
${swscale_LIBRARIES}
)
set_target_properties(${PROJECT_NAME}_node PROPERTIES LINK_FLAGS "-Wl,--no-as-needed")

Expand Down
5 changes: 3 additions & 2 deletions include/usb_cam/learning/depth_anything_v2.hpp
Original file line number Diff line number Diff line change
Expand Up @@ -9,12 +9,13 @@

class DepthAnythingV2 : public LearningInterface {
public:
DepthAnythingV2(ros::NodeHandle* nh, std::string model_path) {
DepthAnythingV2(ros::NodeHandle* nh, std::string model_path, std::string topic) {
_INPUT_SIZE = cv::Size(_HEIGHT, _WIDTH);
_model_path = model_path;
_load_model();

if (nh != nullptr) {
_depth_publication = nh->advertise<sensor_msgs::Image>("depth_anything_v2", 1);
_depth_publication = nh->advertise<sensor_msgs::Image>(topic, 1);
}
}

Expand Down
7 changes: 6 additions & 1 deletion include/usb_cam/learning/interface.hpp
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@
#include <algorithm>
#include <fstream>
#include <iostream>
#include <mutex>
#include <NvInfer.h>
#include <opencv2/opencv.hpp>
#include <sensor_msgs/Image.h>
Expand All @@ -18,7 +19,6 @@ class LearningInterface {
virtual void set_input(sensor_msgs::Image& image) = 0;
virtual void publish() = 0;

void load_model();
void predict();

nvinfer1::ICudaEngine* get_engine() { return _engine; }
Expand All @@ -37,9 +37,14 @@ class LearningInterface {
nvinfer1::IRuntime* _runtime;
std::string _model_path;

void _load_model();

private:
void* _buffers[2] = { nullptr, nullptr };

// Global mutex for prediction calls
static std::mutex predict_mutex;

// TODO: static?
class Logger : public nvinfer1::ILogger {
void log(Severity severity, const char* msg) noexcept override {
Expand Down
2 changes: 2 additions & 0 deletions include/usb_cam/usb_cam.hpp
Original file line number Diff line number Diff line change
Expand Up @@ -119,6 +119,8 @@ typedef struct
// or guvcview
std::string pixel_format_name;
std::string av_device_format;
std::string dav2_file;
std::string dav2_topic;
int image_width;
int image_height;
int framerate;
Expand Down
6 changes: 6 additions & 0 deletions launch/two_mipi_rgb.launch
Original file line number Diff line number Diff line change
Expand Up @@ -17,6 +17,9 @@
<param name="wb_blue_gain" value="0.98"/>
<param name="wb_green_gain" value="0.88"/>
<param name="wb_red_gain" value="1.18"/>

<param name="depth_anything_v2_file" value="/home/asl/Workspace/src/v4l2_camera/test/resources/depth_anything_v2_vits_16.onnx" />
<param name="depth_anything_v2_topic" value="/depth0" />
</node>

<node name="cam1" pkg="usb_cam" type="usb_cam_node" output="screen" >
Expand All @@ -35,5 +38,8 @@
<param name="wb_blue_gain" value="0.98"/>
<param name="wb_green_gain" value="0.88"/>
<param name="wb_red_gain" value="1.18"/>

<!-- <param name="depth_anything_v2_file" value="/home/asl/Workspace/src/v4l2_camera/test/resources/depth_anything_v2_vits_16.onnx" /> -->
<!-- <param name="depth_anything_v2_topic" value="/depth1" /> -->
</node>
</launch>
51 changes: 42 additions & 9 deletions src/interface.cpp
Original file line number Diff line number Diff line change
@@ -1,9 +1,19 @@
#include "usb_cam/learning/interface.hpp"
#include <NvOnnxParser.h>
#include <ros/ros.h>

using namespace nvinfer1;

void LearningInterface::load_model() {
std::mutex LearningInterface::predict_mutex;

void LearningInterface::_load_model() {
std::ifstream file_check(_model_path);
if (!file_check.good()) {
std::cerr << "Error: " << _model_path << "' does not exist." << std::endl;
throw std::runtime_error("Model file not found");
}
file_check.close();

if (_model_path.find(".onnx") == std::string::npos) {
std::ifstream engine_stream(_model_path, std::ios::binary);
engine_stream.seekg(0, std::ios::end);
Expand All @@ -27,11 +37,19 @@ void LearningInterface::load_model() {
}

// Define input dimensions
const auto input_dims = _engine->getTensorShape(_engine->getIOTensorName(0));
const int input_h = input_dims.d[2];
const int input_w = input_dims.d[3];
// TODO: Check dimensions, set as members
#if NV_TENSORRT_MAJOR < 10
auto input_dims = _engine->getBindingDimensions(0);
auto output_dims = _engine->getBindingDimensions(1);
#else
auto input_dims = _engine->getTensorShape(_engine->getIOTensorName(0));
auto output_dims = _engine->getTensorShape(_engine->getIOTensorName(1));
#endif

const size_t input_h = input_dims.d[2];
const size_t input_w = input_dims.d[3];
ROS_INFO("%ld, %ld", input_h, input_w);

// Create CUDA stream
cudaStreamCreate(&_stream);

cudaMalloc(&_buffers[0], 3 * input_h * input_w * sizeof(float));
Expand Down Expand Up @@ -88,10 +106,25 @@ bool LearningInterface::_save_engine(const std::string& onnx_path) {
}

void LearningInterface::predict() {
cudaMemcpyAsync(_buffers[0], _input_data, sizeof(_input_data) * sizeof(float), cudaMemcpyHostToDevice, _stream);
_context->executeV2(_buffers);
cudaStreamSynchronize(_stream);
cudaMemcpyAsync(_output_data, _buffers[1], sizeof(_input_data) * sizeof(float), cudaMemcpyDeviceToHost);
if (predict_mutex.try_lock()) {
ROS_INFO("INSIDE PREDICT");
// TODO: Use input, output size members to set memcpy size correctly
cudaMemcpyAsync(_buffers[0], _input_data, 0, cudaMemcpyHostToDevice, _stream);

#if NV_TENSORRT_MAJOR < 10
_context->enqueueV2(_buffers, _stream, nullptr);
#else
_context->executeV2(_buffers);
#endif

cudaStreamSynchronize(_stream);
// TODO: Use input, output size members to set memcpy size correctly
cudaMemcpyAsync(_output_data, _buffers[1], 0, cudaMemcpyDeviceToHost);
predict_mutex.unlock();

} else {
ROS_INFO("predict in progress, skipping");
}
}

LearningInterface::~LearningInterface() {
Expand Down
12 changes: 8 additions & 4 deletions src/usb_cam_node.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -71,10 +71,6 @@ class UsbCamNode {
}

UsbCamNode() : m_node("~") {
// Setup the network that outputs derivates of the image captured
// TODO: Actual network
networks.push_back(std::make_unique<DepthAnythingV2>(&m_node, "depth_anything_v2_vitb.onnx"));

// Advertise the main image topic
image_transport::ImageTransport it(m_node);
m_image_pub = it.advertiseCamera("image_raw", 1);
Expand Down Expand Up @@ -127,6 +123,14 @@ class UsbCamNode {
m_camera_info->setCameraInfo(camera_info);
}

// Setup the network that outputs derivates of the image captured
m_node.param("depth_anything_v2_file", m_parameters.dav2_file, std::string(""));
m_node.param("depth_anything_v2_topic", m_parameters.dav2_topic, std::string(""));

if (!m_parameters.dav2_file.empty() && !m_parameters.dav2_topic.empty()) {
networks.push_back(std::make_unique<DepthAnythingV2>(&m_node, m_parameters.dav2_file, m_parameters.dav2_topic));
}

ROS_INFO("Starting '%s' (%s) at %dx%d via %s (%s) at %i FPS",
m_parameters.camera_name.c_str(), m_parameters.device_name.c_str(),
m_parameters.image_width, m_parameters.image_height, m_parameters.io_method_name.c_str(),
Expand Down
2 changes: 1 addition & 1 deletion test/test_depth_anything_v2.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -9,7 +9,7 @@
// This class provides access to protected members that we normally don't want to expose
class DepthAnythingV2Test : public DepthAnythingV2 {
public:
DepthAnythingV2Test(const std::string& model_path) : DepthAnythingV2(nullptr, model_path) {}
DepthAnythingV2Test(const std::string& model_path) : DepthAnythingV2(nullptr, model_path, std::string("")) {}
float* get_input_data() { return _input_data; }
};

Expand Down

0 comments on commit b7f290a

Please sign in to comment.