mohammedari
diff --git a/‎opengl_ros/launch/object_position_extraction.launch‎
Lines changed: 19 additions & 8 deletions b/‎opengl_ros/launch/object_position_extraction.launch‎
Lines changed: 19 additions & 8 deletions
diff --git a/‎opengl_ros/src/object_position_extractor_nodecore.cpp‎
Lines changed: 26 additions & 15 deletions b/‎opengl_ros/src/object_position_extractor_nodecore.cpp‎
Lines changed: 26 additions & 15 deletions
diff --git a/‎opengl_ros/src/object_position_extractor_nodecore.h‎
Lines changed: 5 additions & 18 deletions b/‎opengl_ros/src/object_position_extractor_nodecore.h‎
Lines changed: 5 additions & 18 deletions
diff --git a/‎opengl_ros_lib/src/object_position_extractor.cpp‎
Lines changed: 6 additions & 0 deletions b/‎opengl_ros_lib/src/object_position_extractor.cpp‎
Lines changed: 6 additions & 0 deletions
@@ -3,24 +3,30 @@
   <arg name="bag_prefix"                    default="/mnt/log/d435"/>
   <arg name="depth_width"                   default="640"/>
   <arg name="depth_height"                  default="360"/>
-  <arg name="output_width"                  default="320"/>
-  <arg name="output_height"                 default="180"/>
   <arg name="frame_rate"                    default="30"/>
 
+  <!-- use a small output image for accumulation on the CPU -->
+  <arg name="output_width"                  default="160"/>
+  <arg name="output_height"                 default="90"/>
+
   <!-- valid depth range of D435 -->
   <arg name="depth_min"                     default="0.105"/>
   <arg name="depth_max"                     default="10"/>
 
   <!-- color extraction parameter -->
   <arg name="threshold_l"                   default="50"/>
-  <arg name="svm_coef_a"                    default="0.266602955271"/>
-  <arg name="svm_coef_b"                    default="0.0444656815907"/>
-  <arg name="svm_intercept"                 default="-44.3271851592"/>
+  <arg name="svm_coef_a"                    default="0.181817179054"/>
+  <arg name="svm_coef_b"                    default="-0.0205828687538"/>
+  <arg name="svm_intercept"                 default="-27.8266303282"/>
 
   <!-- object position extraction parameter -->
-  <arg name="object_separation_distance"    default="1"/>
-  <arg name="min_pixel_count_for_detection" default="15"/>
-  <arg name="sigma_coefficient"             default="2"/>
+  <arg name="object_separation_distance"    default="2"/>
+  <arg name="min_pixel_count_for_detection" default="30"/> <!-- specify in input resolution -->
+  <arg name="sigma_coefficient"             default="0.25"/>
+  <arg name="object_size_min_x"             default="0.175"/>
+  <arg name="object_size_max_x"             default="0.5"/>
+  <arg name="object_size_min_y"             default="0.175"/>
+  <arg name="object_size_max_y"             default="0.5"/>
 
   <arg name="d435"                          default="false"/>
   <arg name="viewer"                        default="false"/>
@@ -77,6 +83,11 @@
     <param name="min_pixel_count_for_detection" value="$(arg min_pixel_count_for_detection)"/>
     <param name="sigma_coefficient"             value="$(arg sigma_coefficient)"/>
 
+    <param name="object_size_min_x"         value="$(arg object_size_min_x)"/>
+    <param name="object_size_max_x"         value="$(arg object_size_max_x)"/>
+    <param name="object_size_min_y"         value="$(arg object_size_min_y)"/>
+    <param name="object_size_max_y"         value="$(arg object_size_max_y)"/>
+
     <param name="vertex_shader"             value="$(find opengl_ros_lib)/shader/vs_object_position_extraction.glsl"/>
     <param name="fragment_shader"           value="$(find opengl_ros_lib)/shader/fs_object_position_extraction.glsl"/>
 
 
@@ -28,6 +28,10 @@ ObjectPositionExtractorNode::ObjectPositionExtractorNode(const ros::NodeHandle&
     nh_.param<double>("object_separation_distance", object_separation_distance_, 2);
     nh_.param<int>("min_pixel_count_for_detection", min_pixel_count_for_detection_, 10);
-    nh_.param<double>("sigma_coefficient_", sigma_coefficient_, 2);
+    nh_.param<double>("sigma_coefficient", sigma_coefficient_, 2); //key must match <param name="sigma_coefficient"> in the launch file
+    nh_.param<double>("object_size_min_x", object_size_min_x_, 0.1);
+    nh_.param<double>("object_size_max_x", object_size_max_x_, 0.5);
+    nh_.param<double>("object_size_min_y", object_size_min_y_, 0.1);
+    nh_.param<double>("object_size_max_y", object_size_max_y_, 0.5);
 
     //OpenGL parameters
     int color_width, color_height;
@@ -133,8 +137,8 @@ void ObjectPositionExtractorNode::depthCallback(const sensor_msgs::Image::ConstP
     extractor_->updateProjectionMatrix(
         {static_cast<float>(latestColorCameraInfo.K[0]), static_cast<float>(latestColorCameraInfo.K[4])}, 
         {static_cast<float>(latestColorCameraInfo.K[2]), static_cast<float>(latestColorCameraInfo.K[5])}, 
-        {static_cast<float>(cameraInfoMsg->K[0])           , static_cast<float>(cameraInfoMsg->K[4])}, 
-        {static_cast<float>(cameraInfoMsg->K[2])           , static_cast<float>(cameraInfoMsg->K[5])}, 
+        {static_cast<float>(cameraInfoMsg->K[0])       , static_cast<float>(cameraInfoMsg->K[4])}, 
+        {static_cast<float>(cameraInfoMsg->K[2])       , static_cast<float>(cameraInfoMsg->K[5])}, 
         latestDepthToColor_
     );
 
@@ -154,21 +158,23 @@ void ObjectPositionExtractorNode::depthCallback(const sensor_msgs::Image::ConstP
     std::vector<ObjectPositionExtractorNode::ObjectCandidate> candidates;
     for (auto it = positionOut_.begin<cv::Vec4f>(); it != positionOut_.end<cv::Vec4f>(); ++it)
     {
-        auto x = (*it)[0];
-        auto y = (*it)[1];
-        auto z = (*it)[2];
+        auto x = (*it)[0]; //
+        auto y = (*it)[1]; //
+        auto z = (*it)[2]; //accumulated coordinate value
+        auto w = (*it)[3]; //number of accumulated point 
 
         //Not detected at this pixel
-        if (x == 0 && y == 0 && z == 0)
+        if (w == 0)
             continue;
 
-        Eigen::Vector3d point(x, y, z);
+        Eigen::Vector3d point(x / w, y / w, z / w); 
+        int accumulated_pixel_count = static_cast<int>(std::round(w));
 
         //If this is the first point, just add it to the candidates
         if (candidates.size() == 0)
         {
             candidates.emplace_back();
-            candidates[0].add(point);
+            candidates[0].add(point, accumulated_pixel_count);
             continue;
         }
 
@@ -181,12 +187,12 @@ void ObjectPositionExtractorNode::depthCallback(const sensor_msgs::Image::ConstP
         if (object_separation_distance_ < minDistance)
         {
             candidates.emplace_back();
-            candidates[candidates.size() - 1].add(point);
+            candidates[candidates.size() - 1].add(point, accumulated_pixel_count);
             continue;
         }
 
         //Add the point to the neareset candidate
-        candidates[minIndex].add(point);
+        candidates[minIndex].add(point, accumulated_pixel_count);
     }
 
     //Publish Object Array
@@ -195,14 +201,19 @@ void ObjectPositionExtractorNode::depthCallback(const sensor_msgs::Image::ConstP
     {
         auto sigma = candidate.variance();
 
-        auto count = candidate.count(sigma_coefficient_ * sigma);
-        if (count < min_pixel_count_for_detection_)
+        //If number of pixel is lower than threshold, skip it
+        if (candidate.number_of_detected_pixels < min_pixel_count_for_detection_)
             continue;
 
-        ROS_INFO_STREAM("detected object (" << count << "/" << candidate.count() << "px)");
+        //If the size of the object along the camera direction is too small or too large, skip it
+        auto candidate_size = candidate.size(sigma_coefficient_ * sigma);
+        if (candidate_size.x() < object_size_min_x_ || object_size_max_x_ < candidate_size.x() || 
+            candidate_size.y() < object_size_min_y_ || object_size_max_y_ < candidate_size.y())
+            continue;
+
+        ROS_INFO_STREAM("detected object (" << candidate.number_of_detected_pixels << "px)");
 
         auto candidate_pose = candidate.mean(sigma_coefficient_ * sigma);
-        auto candidate_size = candidate.size(sigma_coefficient_ * sigma);
         geometry_msgs::Pose pose;
         {
             pose.position.x = candidate_pose.x();
@@ -229,7 +240,7 @@ void ObjectPositionExtractorNode::depthCallback(const sensor_msgs::Image::ConstP
         o.pose = pose;
         o.twist = zero_twist;
         o.size = size;
-        o.confidence = static_cast<double>(count) / candidate.count(); //set number of pixels in threshold as confidence
+        o.confidence = 1.0; //TODO
 
         objectArray.objects.push_back(o);
     }
 
@@ -45,6 +45,8 @@ class ObjectPositionExtractorNode
     double object_separation_distance_;
     int min_pixel_count_for_detection_;
     double sigma_coefficient_;
+    double object_size_min_x_, object_size_max_x_;
+    double object_size_min_y_, object_size_max_y_;
 
     void colorCallback(const sensor_msgs::Image::ConstPtr& imageMsg, const sensor_msgs::CameraInfoConstPtr & cameraInfoMsg);
     void depthCallback(const sensor_msgs::Image::ConstPtr& imageMsg, const sensor_msgs::CameraInfoConstPtr & cameraInfoMsg);
@@ -56,11 +58,13 @@ class ObjectPositionExtractorNode
     {
         std::vector<Eigen::Vector3d> points;
         Eigen::Vector3d sum = {};
+        int number_of_detected_pixels = 0;
 
-        void add(const Eigen::Vector3d& point)
+        void add(const Eigen::Vector3d& point, int accumulated_pixel_count)
         {
             points.push_back(point);
             sum += point;
+            number_of_detected_pixels += accumulated_pixel_count;
         }
 
         Eigen::Vector3d mean() const
@@ -96,23 +100,6 @@ class ObjectPositionExtractorNode
             return sqrt(squared_diff_sum / points.size());
         }
 
-        int count() const
-        {
-            return points.size();
-        }
-
-        int count(double threshold) const
-        {
-            auto m = mean();
-
-            int count = 0;
-            for (const auto p : points)
-                if ((p - m).norm() < threshold)
-                    ++count;
-
-            return count;
-        }
-
         Eigen::Vector3d size(double threshold = std::numeric_limits<double>::infinity()) const 
         {
             auto m = mean();
 
@@ -97,6 +97,12 @@ ObjectPositionExtractor::Impl::Impl(
 
     //Verticies setup
     vao_.mapVariable(vbo_, glGetAttribLocation(program_.get(), "inputPixel"), 3, GL_FLOAT, 0);
+
+    //Enable blending
+    glEnable(GL_BLEND);
+    glBlendEquation(GL_FUNC_ADD);
+    glBlendFuncSeparatei(0, GL_ONE, GL_ONE , GL_ONE, GL_ONE);  //accumulate position
+    glBlendFuncSeparatei(1, GL_ONE, GL_ZERO, GL_ONE, GL_ZERO); //always overwrite color
 }
 
 void ObjectPositionExtractor::Impl::updateProjectionMatrix(