diff --git a/.gitignore b/.gitignore new file mode 100644 index 0000000..c21e549 --- /dev/null +++ b/.gitignore @@ -0,0 +1,8 @@ +.DS_STORE +/saved +/logs +/data/semantic_kitti +/.vscode +.python-version +__pycache__/ +*.out diff --git a/README.md b/README.md new file mode 100644 index 0000000..96eedd6 --- /dev/null +++ b/README.md @@ -0,0 +1,101 @@ +# MASK4D: Mask Transformer for 4D Panoptic Segmentation +
+ TL;DR: Mask4D is a transformer-based model for 4D Panoptic Segmentation, achieving a new + state-of-the-art performance on the SemanticKITTI test set. +
++ Accurately perceiving and tracking instances over time is essential for the decision-making processes of + autonomous agents interacting safely in dynamic environments. + With this intention, we propose Mask4D for the challenging task of 4D panoptic segmentation of LiDAR point + clouds. +
++ Mask4D is the first transformer-based approach unifying semantic instance segmentation and tracking of + sparse and irregular sequences of 3D point clouds into a single joint model. + Our model directly predicts semantic instances and their temporal associations without relying on any + hand-crafted non-learned association strategies such as probabilistic clustering or voting-based center + prediction. + Instead, Mask4D introduces spatio-temporal instance queries which encode the semantic and geometric + properties of each semantic tracklet in the sequence. +
++ In an in-depth study, we find that it is critical to promote spatially compact instance predictions as + spatio-temporal instance queries tend to merge multiple semantically similar instances, even if they are + spatially distant. + To this end, we regress 6-DOF bounding box parameters from spatio-temporal instance queries, which is used + as an auxiliary task to foster spatially compact predictions. +
++ Mask4D achieves a new state-of-the-art on the SemanticKITTI test set with a score of 68.4 LSTQ, improving + upon published top-performing methods by at least +4.5\%. +
+@article{yilmaz2023mask4d,
+ title = {{Mask4D: Mask Transformer for 4D Panoptic Segmentation}},
+ author = {Yilmaz, Kadir and Schult, Jonas and Nekrasov, Alexey and Leibe, Bastian},
+ journal = {arXiv prepring arXiv:2309.16133},
+ year = {2023}
+ }
+