{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,4]],"date-time":"2026-02-04T18:12:43Z","timestamp":1770228763681,"version":"3.49.0"},"reference-count":49,"publisher":"IEEE","license":[{"start":{"date-parts":[[2023,5,29]],"date-time":"2023-05-29T00:00:00Z","timestamp":1685318400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/2.zoppoz.workers.dev:443\/https\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,5,29]],"date-time":"2023-05-29T00:00:00Z","timestamp":1685318400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/2.zoppoz.workers.dev:443\/https\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"NSFC","doi-asserted-by":"publisher","award":["62206173"],"award-info":[{"award-number":["62206173"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023,5,29]]},"DOI":"10.1109\/icra48891.2023.10161552","type":"proceedings-article","created":{"date-parts":[[2023,7,4]],"date-time":"2023-07-04T17:20:56Z","timestamp":1688491256000},"page":"5602-5609","source":"Crossref","is-referenced-by-count":6,"title":["One Training for Multiple Deployments: Polar-based Adaptive BEV Perception for Autonomous Driving"],"prefix":"10.1109","author":[{"given":"Huitong","family":"Yang","sequence":"first","affiliation":[{"name":"School of Information Science and Technology, ShanghaiTech University,Shanghai,China,201210"}]},{"given":"Xuyang","family":"Bai","sequence":"additional","affiliation":[{"name":"Hong Kong University of Science and Technology,Department of Computer Science and Engineering"}]},{"given":"Xinge","family":"Zhu","sequence":"additional","affiliation":[{"name":"The Chinese University of Hong Kong,Department of Information Engineering"}]},{"given":"Yuexin","family":"Ma","sequence":"additional","affiliation":[{"name":"School of Information Science and Technology, ShanghaiTech University,Shanghai,China,201210"}]}],"member":"263","reference":[{"key":"ref13","article-title":"Hdmapnet: An online hd map construction and evaluation framework","author":"li","year":"2021","journal-title":"ArXiv"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/IVS.2019.8814050"},{"key":"ref15","article-title":"BEVFormer: Learning Bird's-Eye-View Representation from Multi-Camera Images via Spatiotemporal Transformers","author":"li","year":"2022","journal-title":"ArXiv"},{"key":"ref14","article-title":"BEVDepth: Acquisition of Reliable Depth for Multi-view 3D Object Detection","author":"li","year":"2022","journal-title":"CoRR"},{"key":"ref11","article-title":"PolarFormer: Multi-camera 3D Object Detection with Polar Transformers","author":"jiang","year":"2022","journal-title":"ArXiv Preprint"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00090"},{"key":"ref17","article-title":"Petr: Position embedding transfor-mation for multi-view 3d object detection","author":"liu","year":"2022","journal-title":"ArXiv"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00134"},{"key":"ref19","author":"liu","year":"2022","journal-title":"Vision-based Uneven BEV Representation Learning with Polar Rasterization and Surface Estimation"},{"key":"ref18","article-title":"PETRv2: A Unified Framework for 3D Perception from Multi-Camera Images","author":"liu","year":"2022","journal-title":"ArXiv"},{"key":"ref46","article-title":"Monocular 3D Vehicle Detection Using Uncalibrated Traffic Cameras through Homog-raphy","author":"zhu","year":"2021","journal-title":"IROS"},{"key":"ref45","article-title":"Class-balanced Grouping and Sam-pling for Point Cloud 3D Object Detection","volume":"abs 1908 9492","author":"zhu","year":"2019","journal-title":"CoRR"},{"key":"ref48","article-title":"SSN: Shape Signature Networks for Multi-class Object Detection from Point Clouds","author":"zhu","year":"2020","journal-title":"ECCV"},{"key":"ref47","article-title":"Cylindrical and asymmetrical 3d convolution networks for lidar-based perception","author":"zhu","year":"2021","journal-title":"TPAMI"},{"key":"ref42","article-title":"BEVerse: Unified Perception and Prediction in Birds-Eye-View for Vision-Centric Autonomous Driving","author":"zhang","year":"2022","journal-title":"ArXiv"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01161"},{"key":"ref44","article-title":"Objects as Points","volume":"abs 1904 7850","author":"zhou","year":"2019","journal-title":"CoRR"},{"key":"ref43","article-title":"PersDet: Monocular 3D De-tection in Perspective Bird's-Eye-View","volume":"abs 2208 9394","author":"zhou","year":"2022","journal-title":"CoRR"},{"key":"ref49","article-title":"HFT: Lifting Perspective Represen-tations via Hybrid Feature Transformation","author":"zou","year":"2022","journal-title":"ArXiv"},{"key":"ref8","article-title":"FISHING Net: Future In-ference of Semantic Heatmaps In Grids","volume":"abs 2006 9917","author":"hendy","year":"2020","journal-title":"ArXiv"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2022.3142418"},{"key":"ref9","article-title":"BEVDet: High-performance Multi-camera 3D Object Detection in Bird-Eye-View","volume":"abs 2112 11790","author":"huang","year":"2021","journal-title":"CoRR"},{"key":"ref4","first-page":"3302","article-title":"Understanding bird's-eye view of road semantics using an onboard camera","volume":"7 2","author":"baran can","year":"2022","journal-title":"IEEE l of Robotics and Automation"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01164"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00301"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01899"},{"key":"ref40","first-page":"15536","article-title":"Projecting your view at-tentively: Monocular road scene layout estimation via cross-view transformation","author":"yang","year":"2021","journal-title":"CVPR"},{"key":"ref35","first-page":"857","article-title":"Automatic dense visual se-mantic mapping from street-level imagery","author":"sengupta","year":"2012","journal-title":"IROS"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA46639.2022.9811901"},{"key":"ref37","first-page":"1475","article-title":"Probabilistic and Geometric Depth: Detecting Objects in Perspective","volume":"164","author":"wang","year":"0","journal-title":"Conference on Robot Learning"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/ICCVW54120.2021.00107"},{"key":"ref31","article-title":"Orthographic feature transform for monocular 3d object detection","author":"roddick","year":"2018","journal-title":"ArXiv"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01115"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48506.2021.9561169"},{"key":"ref32","article-title":"ORA3D: Overlap Region Aware Multi-view 3D Object Detection","volume":"abs 2207 865","author":"kyoung roh","year":"2022","journal-title":"ArXiv"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19839-7_26"},{"key":"ref1","first-page":"4095","article-title":"A Geometric Approach to Obtain a Bird's Eye View From an Image","author":"ammar abbas","year":"2019","journal-title":"ICCV"},{"key":"ref39","article-title":"PolarNet: Learning to Optimize Polar Keypoints for Keypoint Based Object Detection","author":"wu","year":"2021","journal-title":"9th International Conference on Learning Representations ICLR 2021"},{"key":"ref38","first-page":"180","article-title":"DETR3D: 3D Object Detection from Multi-view Images via 3D-to-2D Queries","author":"wang","year":"0","journal-title":"Conference on Robot Learning"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1007\/BF00201978"},{"key":"ref23","article-title":"Vision-Centric BEV Perception: A Survey","author":"ma","year":"2022","journal-title":"ArXiv Preprint"},{"key":"ref26","article-title":"BEVSegFormer: Bird's Eye View Semantic Segmentation From Arbitrary Camera Rigs","author":"peng","year":"2022","journal-title":"ArXiv"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2020.3004325"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/WACV48630.2021.00010"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19809-0_8"},{"key":"ref21","article-title":"Learning Ego 3D Representation as Ray Tracing","author":"lu","year":"2022","journal-title":"ArXiv Preprint"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00845"},{"key":"ref27","first-page":"194","article-title":"Lift, Splat, Shoot: Encoding Images from Arbitrary Camera Rigs by Implicitly Unprojecting to 3D","author":"philion","year":"2020","journal-title":"ECCV"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/ITSC45102.2020.9294462"}],"event":{"name":"2023 IEEE International Conference on Robotics and Automation (ICRA)","location":"London, United Kingdom","start":{"date-parts":[[2023,5,29]]},"end":{"date-parts":[[2023,6,2]]}},"container-title":["2023 IEEE International Conference on Robotics and Automation (ICRA)"],"original-title":[],"link":[{"URL":"https:\/\/2.zoppoz.workers.dev:443\/http\/xplorestaging.ieee.org\/ielx7\/10160211\/10160212\/10161552.pdf?arnumber=10161552","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,7,24]],"date-time":"2023-07-24T17:38:19Z","timestamp":1690220299000},"score":1,"resource":{"primary":{"URL":"https:\/\/2.zoppoz.workers.dev:443\/https\/ieeexplore.ieee.org\/document\/10161552\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,5,29]]},"references-count":49,"URL":"https:\/\/2.zoppoz.workers.dev:443\/https\/doi.org\/10.1109\/icra48891.2023.10161552","relation":{},"subject":[],"published":{"date-parts":[[2023,5,29]]}}}