-
Notifications
You must be signed in to change notification settings - Fork 1
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
- Loading branch information
0 parents
commit 7d8fd9d
Showing
6 changed files
with
369 additions
and
0 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1 @@ | ||
.vscode/ |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,102 @@ | ||
cmake_minimum_required(VERSION 2.8.3) | ||
project(compressed_image_viewer) | ||
|
||
add_compile_options(-std=c++14) | ||
|
||
find_package(catkin REQUIRED COMPONENTS | ||
cv_bridge | ||
image_transport | ||
roscpp | ||
rospy | ||
sensor_msgs | ||
std_msgs | ||
) | ||
|
||
find_package(OpenCV 4 REQUIRED) | ||
|
||
# catkin_python_setup() | ||
|
||
## Generate messages in the 'msg' folder | ||
# add_message_files( | ||
# FILES | ||
# Message1.msg | ||
# Message2.msg | ||
# ) | ||
|
||
## Generate services in the 'srv' folder | ||
# add_service_files( | ||
# FILES | ||
# Service1.srv | ||
# Service2.srv | ||
# ) | ||
|
||
## Generate actions in the 'action' folder | ||
# add_action_files( | ||
# FILES | ||
# Action1.action | ||
# Action2.action | ||
# ) | ||
|
||
## Generate added messages and services with any dependencies listed here | ||
# generate_messages( | ||
# DEPENDENCIES | ||
# sensor_msgs# std_msgs | ||
# ) | ||
|
||
################################### | ||
## catkin specific configuration ## | ||
################################### | ||
## The catkin_package macro generates cmake config files for your package | ||
## Declare things to be passed to dependent projects | ||
## INCLUDE_DIRS: uncomment this if your package contains header files | ||
## LIBRARIES: libraries you create in this project that dependent projects also need | ||
## CATKIN_DEPENDS: catkin_packages dependent projects also need | ||
## DEPENDS: system dependencies of this project that dependent projects also need | ||
catkin_package( | ||
# INCLUDE_DIRS include | ||
# LIBRARIES compressed_image_viewer | ||
# CATKIN_DEPENDS cv_bridge image_transport roscpp rospy sensor_msgs std_msgs | ||
# DEPENDS system_lib | ||
) | ||
|
||
########### | ||
## Build ## | ||
########### | ||
|
||
## Specify additional locations of header files | ||
## Your package locations should be listed before other locations | ||
include_directories( | ||
include | ||
${catkin_INCLUDE_DIRS} | ||
${OpenCV_INCLUDE_DIRS} | ||
) | ||
|
||
## Declare a C++ library | ||
# add_library(${PROJECT_NAME} | ||
# src/${PROJECT_NAME}/compressed_image_viewer.cpp | ||
# ) | ||
|
||
## Add cmake target dependencies of the library | ||
## as an example, code may need to be generated before libraries | ||
## either from message generation or dynamic reconfigure | ||
# add_dependencies(${PROJECT_NAME} ${${PROJECT_NAME}_EXPORTED_TARGETS} ${catkin_EXPORTED_TARGETS}) | ||
|
||
add_executable(compressed_image_viewer src/compressed_image_viewer.cpp) | ||
|
||
target_link_libraries(compressed_image_viewer | ||
${catkin_LIBRARIES} | ||
${OpenCV_LIBRARIES} | ||
) | ||
|
||
############# | ||
## Testing ## | ||
############# | ||
|
||
## Add gtest based cpp test target and link libraries | ||
# catkin_add_gtest(${PROJECT_NAME}-test test/test_compressed_image_viewer.cpp) | ||
# if(TARGET ${PROJECT_NAME}-test) | ||
# target_link_libraries(${PROJECT_NAME}-test ${PROJECT_NAME}) | ||
# endif() | ||
|
||
## Add folders to be run by python nosetests | ||
# catkin_add_nosetests(test) |
Binary file not shown.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,77 @@ | ||
<?xml version="1.0"?> | ||
<package format="2"> | ||
<name>compressed_image_viewer</name> | ||
<version>0.0.0</version> | ||
<description>The compressed_image_viewer package</description> | ||
|
||
<!-- One maintainer tag required, multiple allowed, one person per tag --> | ||
<!-- Example: --> | ||
<!-- <maintainer email="jane.doe@example.com">Jane Doe</maintainer> --> | ||
<maintainer email="sayter@todo.todo">sayter</maintainer> | ||
|
||
|
||
<!-- One license tag required, multiple allowed, one license per tag --> | ||
<!-- Commonly used license strings: --> | ||
<!-- BSD, MIT, Boost Software License, GPLv2, GPLv3, LGPLv2.1, LGPLv3 --> | ||
<license>TODO</license> | ||
|
||
|
||
<!-- Url tags are optional, but multiple are allowed, one per tag --> | ||
<!-- Optional attribute type can be: website, bugtracker, or repository --> | ||
<!-- Example: --> | ||
<!-- <url type="website">http://wiki.ros.org/compressed_image_viewer</url> --> | ||
|
||
|
||
<!-- Author tags are optional, multiple are allowed, one per tag --> | ||
<!-- Authors do not have to be maintainers, but could be --> | ||
<!-- Example: --> | ||
<!-- <author email="jane.doe@example.com">Jane Doe</author> --> | ||
|
||
|
||
<!-- The *depend tags are used to specify dependencies --> | ||
<!-- Dependencies can be catkin packages or system dependencies --> | ||
<!-- Examples: --> | ||
<!-- Use depend as a shortcut for packages that are both build and exec dependencies --> | ||
<!-- <depend>roscpp</depend> --> | ||
<!-- Note that this is equivalent to the following: --> | ||
<!-- <build_depend>roscpp</build_depend> --> | ||
<!-- <exec_depend>roscpp</exec_depend> --> | ||
<!-- Use build_depend for packages you need at compile time: --> | ||
<!-- <build_depend>message_generation</build_depend> --> | ||
<!-- Use build_export_depend for packages you need in order to build against this package: --> | ||
<!-- <build_export_depend>message_generation</build_export_depend> --> | ||
<!-- Use buildtool_depend for build tool packages: --> | ||
<!-- <buildtool_depend>catkin</buildtool_depend> --> | ||
<!-- Use exec_depend for packages you need at runtime: --> | ||
<!-- <exec_depend>message_runtime</exec_depend> --> | ||
<!-- Use test_depend for packages you need only for testing: --> | ||
<!-- <test_depend>gtest</test_depend> --> | ||
<!-- Use doc_depend for packages you need only for building documentation: --> | ||
<!-- <doc_depend>doxygen</doc_depend> --> | ||
<buildtool_depend>catkin</buildtool_depend> | ||
<build_depend>cv_bridge</build_depend> | ||
<build_depend>image_transport</build_depend> | ||
<build_depend>roscpp</build_depend> | ||
<build_depend>rospy</build_depend> | ||
<build_depend>sensor_msgs</build_depend> | ||
<build_depend>std_msgs</build_depend> | ||
<build_export_depend>cv_bridge</build_export_depend> | ||
<build_export_depend>image_transport</build_export_depend> | ||
<build_export_depend>roscpp</build_export_depend> | ||
<build_export_depend>rospy</build_export_depend> | ||
<build_export_depend>sensor_msgs</build_export_depend> | ||
<build_export_depend>std_msgs</build_export_depend> | ||
<exec_depend>cv_bridge</exec_depend> | ||
<exec_depend>image_transport</exec_depend> | ||
<exec_depend>roscpp</exec_depend> | ||
<exec_depend>rospy</exec_depend> | ||
<exec_depend>sensor_msgs</exec_depend> | ||
<exec_depend>std_msgs</exec_depend> | ||
|
||
|
||
<!-- The export tag contains other, unspecified, tags --> | ||
<export> | ||
<!-- Other tools can request additional information be placed here --> | ||
|
||
</export> | ||
</package> |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,157 @@ | ||
#!/usr/bin/env python3 | ||
import cv2 | ||
import rospy | ||
import rospkg | ||
import numpy as np | ||
import onnx | ||
import onnxruntime as ort | ||
from onnx_tf.backend import prepare | ||
from sensor_msgs.msg import CompressedImage | ||
|
||
def area_of(left_top, right_bottom): | ||
""" | ||
Compute the areas of rectangles given two corners. | ||
Args: | ||
left_top (N, 2): left top corner. | ||
right_bottom (N, 2): right bottom corner. | ||
Returns: | ||
area (N): return the area. | ||
""" | ||
hw = np.clip(right_bottom - left_top, 0.0, None) | ||
return hw[..., 0] * hw[..., 1] | ||
|
||
def iou_of(boxes0, boxes1, eps=1e-5): | ||
""" | ||
Return intersection-over-union (Jaccard index) of boxes. | ||
Args: | ||
boxes0 (N, 4): ground truth boxes. | ||
boxes1 (N or 1, 4): predicted boxes. | ||
eps: a small number to avoid 0 as denominator. | ||
Returns: | ||
iou (N): IoU values. | ||
""" | ||
overlap_left_top = np.maximum(boxes0[..., :2], boxes1[..., :2]) | ||
overlap_right_bottom = np.minimum(boxes0[..., 2:], boxes1[..., 2:]) | ||
|
||
overlap_area = area_of(overlap_left_top, overlap_right_bottom) | ||
area0 = area_of(boxes0[..., :2], boxes0[..., 2:]) | ||
area1 = area_of(boxes1[..., :2], boxes1[..., 2:]) | ||
return overlap_area / (area0 + area1 - overlap_area + eps) | ||
|
||
def hard_nms(box_scores, iou_threshold, top_k=-1, candidate_size=200): | ||
""" | ||
Perform hard non-maximum-supression to filter out boxes with iou greater | ||
than threshold | ||
Args: | ||
box_scores (N, 5): boxes in corner-form and probabilities. | ||
iou_threshold: intersection over union threshold. | ||
top_k: keep top_k results. If k <= 0, keep all the results. | ||
candidate_size: only consider the candidates with the highest scores. | ||
Returns: | ||
picked: a list of indexes of the kept boxes | ||
""" | ||
scores = box_scores[:, -1] | ||
boxes = box_scores[:, :-1] | ||
picked = [] | ||
indexes = np.argsort(scores) | ||
indexes = indexes[-candidate_size:] | ||
while len(indexes) > 0: | ||
current = indexes[-1] | ||
picked.append(current) | ||
if 0 < top_k == len(picked) or len(indexes) == 1: | ||
break | ||
current_box = boxes[current, :] | ||
indexes = indexes[:-1] | ||
rest_boxes = boxes[indexes, :] | ||
iou = iou_of( | ||
rest_boxes, | ||
np.expand_dims(current_box, axis=0), | ||
) | ||
indexes = indexes[iou <= iou_threshold] | ||
|
||
return box_scores[picked, :] | ||
|
||
def predict(width, height, confidences, boxes, prob_threshold, iou_threshold=0.5, top_k=-1): | ||
""" | ||
Select boxes that contain human faces | ||
Args: | ||
width: original image width | ||
height: original image height | ||
confidences (N, 2): confidence array | ||
boxes (N, 4): boxes array in corner-form | ||
iou_threshold: intersection over union threshold. | ||
top_k: keep top_k results. If k <= 0, keep all the results. | ||
Returns: | ||
boxes (k, 4): an array of boxes kept | ||
labels (k): an array of labels for each boxes kept | ||
probs (k): an array of probabilities for each boxes being in corresponding labels | ||
""" | ||
boxes = boxes[0] | ||
confidences = confidences[0] | ||
picked_box_probs = [] | ||
picked_labels = [] | ||
for class_index in range(1, confidences.shape[1]): | ||
probs = confidences[:, class_index] | ||
mask = probs > prob_threshold | ||
probs = probs[mask] | ||
if probs.shape[0] == 0: | ||
continue | ||
subset_boxes = boxes[mask, :] | ||
box_probs = np.concatenate([subset_boxes, probs.reshape(-1, 1)], axis=1) | ||
box_probs = hard_nms(box_probs, | ||
iou_threshold=iou_threshold, | ||
top_k=top_k, | ||
) | ||
picked_box_probs.append(box_probs) | ||
picked_labels.extend([class_index] * box_probs.shape[0]) | ||
if not picked_box_probs: | ||
return np.array([]), np.array([]), np.array([]) | ||
picked_box_probs = np.concatenate(picked_box_probs) | ||
picked_box_probs[:, 0] *= width | ||
picked_box_probs[:, 1] *= height | ||
picked_box_probs[:, 2] *= width | ||
picked_box_probs[:, 3] *= height | ||
return picked_box_probs[:, :4].astype(np.int32), np.array(picked_labels), picked_box_probs[:, 4] | ||
|
||
class face_detection(): | ||
def __init__(self): | ||
rospy.init_node('face_detection', anonymous=True) | ||
pkg_path = rospkg.RosPack().get_path('compressed_image_viewer') | ||
self.onnx_path = pkg_path + '/onnx/ultra_light_640.onnx' | ||
self.onnx_model = onnx.load(self.onnx_path) | ||
# onnx.checker.check_model(self.onnx_model) | ||
# onnx.helper.printable_graph(self.onnx_model.graph) | ||
self.predictor = prepare(self.onnx_model) | ||
self.ort_session = ort.InferenceSession(self.onnx_path) | ||
self.input_name = self.ort_session.get_inputs()[0].name | ||
rospy.Subscriber('/camera/rgb/image_rect_color/compressed', CompressedImage, self.compressedCallback) | ||
|
||
def compressedCallback(self, image): | ||
encoded_data = np.fromstring(image.data, np.uint8) | ||
decoded_image = cv2.imdecode(encoded_data, cv2.IMREAD_UNCHANGED) | ||
h, w, _ = decoded_image.shape | ||
preprocessed_image = cv2.cvtColor(decoded_image, cv2.COLOR_BGR2RGB) | ||
mean = np.array([127, 127, 127]) | ||
preprocessed_image = (preprocessed_image - mean) / 128 | ||
preprocessed_image = np.transpose(preprocessed_image, [2, 0, 1]) | ||
preprocessed_image = np.expand_dims(preprocessed_image, axis=0) | ||
preprocessed_image = preprocessed_image.astype(np.float32) | ||
confidences, boxes = self.ort_session.run(None, {self.input_name: preprocessed_image}) | ||
boxes, labels, probs = predict(w, h, confidences, boxes, 0.7) | ||
for i in range(boxes.shape[0]): | ||
box = boxes[i, :] | ||
x1, y1, x2, y2 = box | ||
cv2.rectangle(decoded_image, (x1, y1), (x2, y2), (80,18,236), 2) | ||
cv2.rectangle(decoded_image, (x1, y2 - 20), (x2, y2), (80,18,236), cv2.FILLED) | ||
font = cv2.FONT_HERSHEY_DUPLEX | ||
text = f"face: {labels[i]}" | ||
cv2.putText(decoded_image, text, (x1 + 6, y2 - 6), font, 0.5, (255, 255, 255), 1) | ||
cv2.imshow('compressed', decoded_image) | ||
cv2.waitKey(1) | ||
|
||
def start(self): | ||
rospy.spin() | ||
|
||
if __name__ == '__main__': | ||
face_detection = face_detection() | ||
face_detection.start() |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,32 @@ | ||
#include <ros/ros.h> | ||
#include <image_transport/image_transport.h> | ||
#include <cv_bridge/cv_bridge.h> | ||
#include <sensor_msgs/image_encodings.h> | ||
#include <opencv2/imgproc/imgproc.hpp> | ||
#include <opencv2/highgui/highgui.hpp> | ||
#include <vector> | ||
|
||
void imageCb(const sensor_msgs::CompressedImageConstPtr& msg) | ||
{ | ||
try | ||
{ | ||
cv::Mat image = cv::imdecode(cv::Mat(msg->data), cv::IMREAD_UNCHANGED); | ||
cv::imshow("compressed", image); | ||
cv::waitKey(10); | ||
} | ||
catch (cv_bridge::Exception& e) | ||
{ | ||
ROS_ERROR("cv_bridge exception: %s", e.what()); | ||
} | ||
} | ||
|
||
|
||
int main(int argc, char** argv) | ||
{ | ||
ros::init(argc, argv, "compressed_image_viewer"); | ||
ros::NodeHandle n; | ||
ros::Subscriber depth_image_sub = n.subscribe("/camera/rgb/image_rect_color/compressed", 30, imageCb); | ||
|
||
ros::spin(); | ||
return 0; | ||
} |