VoxNet: A 3D Convolutional Neural Network for Real-Time Object Recognition

VoxNet: A 3D Convolutional Neural Network for Real-Time Object Recognition. Maturana, D. & Scherer, S. IROS, 2015.

Robust object recognition is a crucial skill for robots operating autonomously in real world environments. Range sensors such as LiDAR and RGBD cameras are increasingly found in modern robotic systems, providing a rich source of 3D information that can aid in this task. However, many current systems do not fully utilize this information and have trouble efficiently dealing with large amounts of point cloud data. In this paper, we propose VoxNet, an architecture to tackle this problem by integrating a volumetric Occupancy Grid representation with a supervised 3D Convolutional Neural Network (3D CNN). We evaluate our approach on publicly available benchmarks using LiDAR, RGBD, and CAD data. VoxNet achieves accuracy beyond the state of the art while labeling hundreds of instances per second.

@comment{Conference paper from the IROS 2015 proceedings, per the doi prefix. The fields type, id, created, file_attached, profile_id, group_id, last_modified, read, starred, authored, confirmed, hidden, citation_key, folder_uuids, private_publication and bibtype look like reference-manager export metadata; standard bibliography styles ignore unknown fields.}
@inproceedings{Maturana2015,
 title = {{VoxNet}: A {3D} Convolutional Neural Network for Real-Time Object Recognition},
 type = {inproceedings},
 year = {2015},
 pages = {922--928},
 id = {2a9ae61b-a81e-3450-a78a-1b3df85504a8},
 created = {2020-10-01T13:48:35.417Z},
 file_attached = {true},
 profile_id = {bfbbf840-4c42-3914-a463-19024f50b30c},
 group_id = {1ff583c0-be37-34fa-9c04-73c69437d354},
 last_modified = {2021-01-28T08:25:30.932Z},
 read = {true},
 starred = {false},
 authored = {false},
 confirmed = {true},
 hidden = {false},
 citation_key = {Maturana2015},
 folder_uuids = {a89f4866-a7e8-4ea9-aa98-e3f470892f7c},
 private_publication = {false},
 abstract = {Robust object recognition is a crucial skill for robots operating autonomously in real world environments. Range sensors such as LiDAR and RGBD cameras are increasingly found in modern robotic systems, providing a rich source of 3D information that can aid in this task. However, many current systems do not fully utilize this information and have trouble efficiently dealing with large amounts of point cloud data. In this paper, we propose VoxNet, an architecture to tackle this problem by integrating a volumetric Occupancy Grid representation with a supervised 3D Convolutional Neural Network (3D CNN). We evaluate our approach on publicly available benchmarks using LiDAR, RGBD, and CAD data. VoxNet achieves accuracy beyond the state of the art while labeling hundreds of instances per second.},
 bibtype = {inproceedings},
 author = {Maturana, Daniel and Scherer, Sebastian},
 doi = {10.1109/IROS.2015.7353481},
 booktitle = {2015 {IEEE/RSJ} International Conference on Intelligent Robots and Systems ({IROS})}
}

Downloads: 0

{"_id":"oEgGBmHyZNBxrGWT9","bibbaseid":"maturana-scherer-voxneta3dconvolutionalneuralnetworkforrealtimeobjectrecognition-2015","downloads":0,"creationDate":"2016-02-25T17:50:18.052Z","title":"VoxNet: A 3D Convolutional Neural Network for Real-Time Object Recognition","author_short":["Maturana, D.","Scherer, S."],"year":2015,"bibtype":"article","biburl":"https://bibbase.org/service/mendeley/bfbbf840-4c42-3914-a463-19024f50b30c","bibdata":{"title":"VoxNet: A 3D Convolutional Neural Network for Real-Time Object Recognition","type":"article","year":"2015","pages":"922-928","id":"2a9ae61b-a81e-3450-a78a-1b3df85504a8","created":"2020-10-01T13:48:35.417Z","file_attached":"true","profile_id":"bfbbf840-4c42-3914-a463-19024f50b30c","group_id":"1ff583c0-be37-34fa-9c04-73c69437d354","last_modified":"2021-01-28T08:25:30.932Z","read":"true","starred":false,"authored":false,"confirmed":"true","hidden":false,"citation_key":"Maturana2015","folder_uuids":"a89f4866-a7e8-4ea9-aa98-e3f470892f7c","private_publication":false,"abstract":"Robust object recognition is a crucial skill for robots operating autonomously in real world environments. Range sensors such as LiDAR and RGBD cameras are in- creasingly found in modern robotic systems, providing a rich source of 3D information that can aid in this task. However, many current systems do not fully utilize this information and have trouble efficiently dealing with large amounts of point cloud data. In this paper, we propose VoxNet, an architecture to tackle this problem by integrating a volumetric Occupancy Grid representation with a supervised 3D Convolutional Neural Network (3D CNN). We evaluate our approach on publicly available benchmarks using LiDAR, RGBD, and CAD data. 
VoxNet achieves accuracy beyond the state of the art while labeling hundreds of instances per second.","bibtype":"article","author":"Maturana, Daniel and Scherer, Sebastian","doi":"10.1109/IROS.2015.7353481","journal":"Iros","bibtex":"@article{\n title = {VoxNet: A 3D Convolutional Neural Network for Real-Time Object Recognition},\n type = {article},\n year = {2015},\n pages = {922-928},\n id = {2a9ae61b-a81e-3450-a78a-1b3df85504a8},\n created = {2020-10-01T13:48:35.417Z},\n file_attached = {true},\n profile_id = {bfbbf840-4c42-3914-a463-19024f50b30c},\n group_id = {1ff583c0-be37-34fa-9c04-73c69437d354},\n last_modified = {2021-01-28T08:25:30.932Z},\n read = {true},\n starred = {false},\n authored = {false},\n confirmed = {true},\n hidden = {false},\n citation_key = {Maturana2015},\n folder_uuids = {a89f4866-a7e8-4ea9-aa98-e3f470892f7c},\n private_publication = {false},\n abstract = {Robust object recognition is a crucial skill for robots operating autonomously in real world environments. Range sensors such as LiDAR and RGBD cameras are in- creasingly found in modern robotic systems, providing a rich source of 3D information that can aid in this task. However, many current systems do not fully utilize this information and have trouble efficiently dealing with large amounts of point cloud data. In this paper, we propose VoxNet, an architecture to tackle this problem by integrating a volumetric Occupancy Grid representation with a supervised 3D Convolutional Neural Network (3D CNN). We evaluate our approach on publicly available benchmarks using LiDAR, RGBD, and CAD data. 
VoxNet achieves accuracy beyond the state of the art while labeling hundreds of instances per second.},\n bibtype = {article},\n author = {Maturana, Daniel and Scherer, Sebastian},\n doi = {10.1109/IROS.2015.7353481},\n journal = {Iros}\n}","author_short":["Maturana, D.","Scherer, S."],"urls":{"Paper":"https://bibbase.org/service/mendeley/bfbbf840-4c42-3914-a463-19024f50b30c/file/413d65a2-edc0-9efb-67e7-70e61d778fae/voxnet_maturana_scherer_iros15.pdf.pdf"},"biburl":"https://bibbase.org/service/mendeley/bfbbf840-4c42-3914-a463-19024f50b30c","bibbaseid":"maturana-scherer-voxneta3dconvolutionalneuralnetworkforrealtimeobjectrecognition-2015","role":"author","metadata":{"authorlinks":{}},"downloads":0},"search_terms":["voxnet","convolutional","neural","network","real","time","object","recognition","maturana","scherer"],"keywords":[],"authorIDs":[],"dataSources":["h2ykM5EjvLWRGkzH2","ya2CyA73rpZseyrZ8","2252seNhipfTmjEBQ"]}