Explicit and Implicit Box Equivariance Learning for Weakly-Supervised Rotated Object Detection. Wang, L., Zhan, Y., Lin, X., Yu, B., Ding, L., Zhu, J., & Tao, D. IEEE Transactions on Emerging Topics in Computational Intelligence, Institute of Electrical and Electronics Engineers Inc., 2024. Paper doi abstract bibtex Rotated object detection has emerged as a preferred alternative to the conventional Horizontal Box (HBox) object detection in various tasks. However, the majority of existing detection datasets are still annotated using HBox. Re-annotating these datasets for rotated object detection is notably inefficient and labor-intensive. Recently, weakly-supervised detectors based directly on HBox have provided a solution to bridge the gap between the rotated bounding box (RBox) prediction and the weak annotations. Nonetheless, they tend to overlook the potential impact of factors such as bounding box position, aspect ratio, and scale on angle prediction. Additionally, inconsistencies arise when evaluating rotation variations, hindering the inference performance. In light of these limitations, we propose an explicit and implicit equivariance detector (EIE-Det) to predict fine-grained RBox based on HBox annotations. Along with a shared backbone and neck structure, our proposed EIE-Det comprises a weakly supervised (WS) branch for predicting coarse RBox from HBox labels, an explicit equivariance (EE) branch for learning rotation consistency, and an implicit equivariance (IE) branch for learning position, aspect ratio, and scale consistency. Furthermore, we introduce the Tanimoto Coefficient for vector-based bounding box regression, enabling a comprehensive assessment of model prediction bias, thereby eliminating interference from variations in box aspect ratio and scale. Experiments demonstrate that our method not only significantly surpasses state-of-the-art models supervised with HBox but also achieves accuracy comparable to fully-supervised detectors (75.74$\%$ and 58.50$\%$ $AP_50$ on DOTA and DIOR-R, respectively).
@article{
title = {Explicit and Implicit Box Equivariance Learning for Weakly-Supervised Rotated Object Detection},
type = {article},
year = {2024},
keywords = {Annotations,Box equivariance,Detectors,Feature extraction,Neck,Object detection,Shape,Task analysis,rotated object detection,weakly-supervised learning},
publisher = {Institute of Electrical and Electronics Engineers Inc.},
id = {9ead5ef3-c321-3e7c-91c0-8ede06c3d8a3},
created = {2024-07-03T09:39:40.891Z},
accessed = {2024-07-03},
file_attached = {true},
profile_id = {f1f70cad-e32d-3de2-a3c0-be1736cb88be},
group_id = {5ec9cc91-a5d6-3de5-82f3-3ef3d98a89c1},
last_modified = {2024-07-03T09:40:04.337Z},
read = {false},
starred = {false},
authored = {false},
confirmed = {false},
hidden = {false},
folder_uuids = {df28411a-ed7f-4991-8358-d39685eb4bf0},
private_publication = {false},
abstract = {Rotated object detection has emerged as a preferred alternative to the conventional Horizontal Box (HBox) object detection in various tasks. However, the majority of existing detection datasets are still annotated using HBox. Re-annotating these datasets for rotated object detection is notably inefficient and labor-intensive. Recently, weakly-supervised detectors based directly on HBox have provided a solution to bridge the gap between the rotated bounding box (RBox) prediction and the weak annotations. Nonetheless, they tend to overlook the potential impact of factors such as bounding box position, aspect ratio, and scale on angle prediction. Additionally, inconsistencies arise when evaluating rotation variations, hindering the inference performance. In light of these limitations, we propose an explicit and implicit equivariance detector (EIE-Det) to predict fine-grained RBox based on HBox annotations. Along with a shared backbone and neck structure, our proposed EIE-Det comprises a weakly supervised (WS) branch for predicting coarse RBox from HBox labels, an explicit equivariance (EE) branch for learning rotation consistency, and an implicit equivariance (IE) branch for learning position, aspect ratio, and scale consistency. Furthermore, we introduce the Tanimoto Coefficient for vector-based bounding box regression, enabling a comprehensive assessment of model prediction bias, thereby eliminating interference from variations in box aspect ratio and scale. Experiments demonstrate that our method not only significantly surpasses state-of-the-art models supervised with HBox but also achieves accuracy comparable to fully-supervised detectors (75.74<inline-formula><tex-math notation="LaTeX">$\%$</tex-math></inline-formula> and 58.50<inline-formula><tex-math notation="LaTeX">$\%$</tex-math></inline-formula> <inline-formula><tex-math notation="LaTeX">$AP_50$</tex-math></inline-formula> on DOTA and DIOR-R, respectively).},
bibtype = {article},
author = {Wang, Linfei and Zhan, Yibing and Lin, Xu and Yu, Baosheng and Ding, Liang and Zhu, Jianqing and Tao, Dapeng},
doi = {10.1109/TETCI.2024.3398020},
journal = {IEEE Transactions on Emerging Topics in Computational Intelligence}
}
Downloads: 0
{"_id":"BByRLBxDJyENGSZPw","bibbaseid":"wang-zhan-lin-yu-ding-zhu-tao-explicitandimplicitboxequivariancelearningforweaklysupervisedrotatedobjectdetection-2024","author_short":["Wang, L.","Zhan, Y.","Lin, X.","Yu, B.","Ding, L.","Zhu, J.","Tao, D."],"bibdata":{"title":"Explicit and Implicit Box Equivariance Learning for Weakly-Supervised Rotated Object Detection","type":"article","year":"2024","keywords":"Annotations,Box equivariance,Detectors,Feature extraction,Neck,Object detection,Shape,Task analysis,rotated object detection,weakly-supervised learning","publisher":"Institute of Electrical and Electronics Engineers Inc.","id":"9ead5ef3-c321-3e7c-91c0-8ede06c3d8a3","created":"2024-07-03T09:39:40.891Z","accessed":"2024-07-03","file_attached":"true","profile_id":"f1f70cad-e32d-3de2-a3c0-be1736cb88be","group_id":"5ec9cc91-a5d6-3de5-82f3-3ef3d98a89c1","last_modified":"2024-07-03T09:40:04.337Z","read":false,"starred":false,"authored":false,"confirmed":false,"hidden":false,"folder_uuids":"df28411a-ed7f-4991-8358-d39685eb4bf0","private_publication":false,"abstract":"Rotated object detection has emerged as a preferred alternative to the conventional Horizontal Box (HBox) object detection in various tasks. However, the majority of existing detection datasets are still annotated using HBox. Re-annotating these datasets for rotated object detection is notably inefficient and labor-intensive. Recently, weakly-supervised detectors based directly on HBox have provided a solution to bridge the gap between the rotated bounding box (RBox) prediction and the weak annotations. Nonetheless, they tend to overlook the potential impact of factors such as bounding box position, aspect ratio, and scale on angle prediction. Additionally, inconsistencies arise when evaluating rotation variations, hindering the inference performance. In light of these limitations, we propose an explicit and implicit equivariance detector (EIE-Det) to predict fine-grained RBox based on HBox annotations. Along with a shared backbone and neck structure, our proposed EIE-Det comprises a weakly supervised (WS) branch for predicting coarse RBox from HBox labels, an explicit equivariance (EE) branch for learning rotation consistency, and an implicit equivariance (IE) branch for learning position, aspect ratio, and scale consistency. Furthermore, we introduce the Tanimoto Coefficient for vector-based bounding box regression, enabling a comprehensive assessment of model prediction bias, thereby eliminating interference from variations in box aspect ratio and scale. Experiments demonstrate that our method not only significantly surpasses state-of-the-art models supervised with HBox but also achieves accuracy comparable to fully-supervised detectors (75.74<inline-formula><tex-math notation=\"LaTeX\">$\\%$</tex-math></inline-formula> and 58.50<inline-formula><tex-math notation=\"LaTeX\">$\\%$</tex-math></inline-formula> <inline-formula><tex-math notation=\"LaTeX\">$AP_50$</tex-math></inline-formula> on DOTA and DIOR-R, respectively).","bibtype":"article","author":"Wang, Linfei and Zhan, Yibing and Lin, Xu and Yu, Baosheng and Ding, Liang and Zhu, Jianqing and Tao, Dapeng","doi":"10.1109/TETCI.2024.3398020","journal":"IEEE Transactions on Emerging Topics in Computational Intelligence","bibtex":"@article{\n title = {Explicit and Implicit Box Equivariance Learning for Weakly-Supervised Rotated Object Detection},\n type = {article},\n year = {2024},\n keywords = {Annotations,Box equivariance,Detectors,Feature extraction,Neck,Object detection,Shape,Task analysis,rotated object detection,weakly-supervised learning},\n publisher = {Institute of Electrical and Electronics Engineers Inc.},\n id = {9ead5ef3-c321-3e7c-91c0-8ede06c3d8a3},\n created = {2024-07-03T09:39:40.891Z},\n accessed = {2024-07-03},\n file_attached = {true},\n profile_id = {f1f70cad-e32d-3de2-a3c0-be1736cb88be},\n group_id = {5ec9cc91-a5d6-3de5-82f3-3ef3d98a89c1},\n last_modified = {2024-07-03T09:40:04.337Z},\n read = {false},\n starred = {false},\n authored = {false},\n confirmed = {false},\n hidden = {false},\n folder_uuids = {df28411a-ed7f-4991-8358-d39685eb4bf0},\n private_publication = {false},\n abstract = {Rotated object detection has emerged as a preferred alternative to the conventional Horizontal Box (HBox) object detection in various tasks. However, the majority of existing detection datasets are still annotated using HBox. Re-annotating these datasets for rotated object detection is notably inefficient and labor-intensive. Recently, weakly-supervised detectors based directly on HBox have provided a solution to bridge the gap between the rotated bounding box (RBox) prediction and the weak annotations. Nonetheless, they tend to overlook the potential impact of factors such as bounding box position, aspect ratio, and scale on angle prediction. Additionally, inconsistencies arise when evaluating rotation variations, hindering the inference performance. In light of these limitations, we propose an explicit and implicit equivariance detector (EIE-Det) to predict fine-grained RBox based on HBox annotations. Along with a shared backbone and neck structure, our proposed EIE-Det comprises a weakly supervised (WS) branch for predicting coarse RBox from HBox labels, an explicit equivariance (EE) branch for learning rotation consistency, and an implicit equivariance (IE) branch for learning position, aspect ratio, and scale consistency. Furthermore, we introduce the Tanimoto Coefficient for vector-based bounding box regression, enabling a comprehensive assessment of model prediction bias, thereby eliminating interference from variations in box aspect ratio and scale. Experiments demonstrate that our method not only significantly surpasses state-of-the-art models supervised with HBox but also achieves accuracy comparable to fully-supervised detectors (75.74<inline-formula><tex-math notation=\"LaTeX\">$\\%$</tex-math></inline-formula> and 58.50<inline-formula><tex-math notation=\"LaTeX\">$\\%$</tex-math></inline-formula> <inline-formula><tex-math notation=\"LaTeX\">$AP_50$</tex-math></inline-formula> on DOTA and DIOR-R, respectively).},\n bibtype = {article},\n author = {Wang, Linfei and Zhan, Yibing and Lin, Xu and Yu, Baosheng and Ding, Liang and Zhu, Jianqing and Tao, Dapeng},\n doi = {10.1109/TETCI.2024.3398020},\n journal = {IEEE Transactions on Emerging Topics in Computational Intelligence}\n}","author_short":["Wang, L.","Zhan, Y.","Lin, X.","Yu, B.","Ding, L.","Zhu, J.","Tao, D."],"urls":{"Paper":"https://bibbase.org/service/mendeley/bfbbf840-4c42-3914-a463-19024f50b30c/file/46d54a9c-8900-99ff-3b0d-b1e8e1f99c4a/full_text.pdf.pdf"},"biburl":"https://bibbase.org/service/mendeley/bfbbf840-4c42-3914-a463-19024f50b30c","bibbaseid":"wang-zhan-lin-yu-ding-zhu-tao-explicitandimplicitboxequivariancelearningforweaklysupervisedrotatedobjectdetection-2024","role":"author","keyword":["Annotations","Box equivariance","Detectors","Feature extraction","Neck","Object detection","Shape","Task analysis","rotated object detection","weakly-supervised learning"],"metadata":{"authorlinks":{}},"downloads":0},"bibtype":"article","biburl":"https://bibbase.org/service/mendeley/bfbbf840-4c42-3914-a463-19024f50b30c","dataSources":["2252seNhipfTmjEBQ"],"keywords":["annotations","box equivariance","detectors","feature extraction","neck","object detection","shape","task analysis","rotated object detection","weakly-supervised learning"],"search_terms":["explicit","implicit","box","equivariance","learning","weakly","supervised","rotated","object","detection","wang","zhan","lin","yu","ding","zhu","tao"],"title":"Explicit and Implicit Box Equivariance Learning for Weakly-Supervised Rotated Object Detection","year":2024}