{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,10]],"date-time":"2026-02-10T16:10:39Z","timestamp":1770739839739,"version":"3.49.0"},"reference-count":49,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/legalcode"}],"funder":[{"name":"Chongqing Airport Group Company Ltd."},{"name":"Nanjing Lukou International Airport Technology Company Ltd"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Access"],"published-print":{"date-parts":[[2026]]},"DOI":"10.1109\/access.2026.3658620","type":"journal-article","created":{"date-parts":[[2026,1,28]],"date-time":"2026-01-28T21:00:22Z","timestamp":1769634022000},"page":"15748-15762","source":"Crossref","is-referenced-by-count":0,"title":["AIRFLOW: An End-to-End Spatial\u2013Channel Cross Attention Framework for Real-Time Passenger Detection and Tracking"],"prefix":"10.1109","volume":"14","author":[{"given":"Can","family":"Zhou","sequence":"first","affiliation":[{"name":"Expand Construction Command Department, Chongqing Airport Group Company Ltd., Chongqing, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0006-3064-647X","authenticated-orcid":false,"given":"Lei","family":"Wu","sequence":"additional","affiliation":[{"name":"Nanjing Lukou International Airport Technology Company Ltd., Nanjing, China"}]},{"given":"Zhangxin","family":"Kan","sequence":"additional","affiliation":[{"name":"Nanjing Lukou International Airport Technology Company Ltd., Nanjing, China"}]},{"given":"Hai","family":"Wang","sequence":"additional","affiliation":[{"name":"Expand Construction Command Department, Chongqing Airport Group Company Ltd., Chongqing, 
China"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58452-8_13"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.01605"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/tpami.2016.2577031"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.91"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46448-0_2"},{"key":"ref7","article-title":"YOLOv3: An incremental improvement","author":"Redmon","year":"2018","journal-title":"arXiv:1804.02767"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2004.10934"},{"key":"ref9","volume-title":"YOLOv5 by Ultralytics","author":"Jocher","year":"2020"},{"key":"ref10","volume-title":"YOLOv8 By Ultralytics","author":"Jocher","year":"2023"},{"key":"ref11","article-title":"YOLOv10: Real-time end-to-end object detection","author":"Wang","year":"2024","journal-title":"arXiv:2405.14458"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1561\/116.20240058"},{"key":"ref13","article-title":"Deformable DETR: Deformable transformers for end-to-end object detection","author":"Zhu","year":"2020","journal-title":"arXiv:2010.04159"},{"key":"ref14","article-title":"DINO: DETR with improved DeNoising anchor boxes for end-to-end object detection","author":"Zhang","year":"2022","journal-title":"arXiv:2203.03605"},{"key":"ref15","article-title":"RT-DETRv2: Improved baseline with bag-of-freebies for real-time detection 
transformer","author":"Lv","year":"2024","journal-title":"arXiv:2407.17140"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP.2016.7533003"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP.2017.8296962"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-20047-2_1"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-021-01513-4"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00864"},{"key":"ref21","article-title":"TransTrack: Multiple object tracking with transformer","author":"Sun","year":"2020","journal-title":"arXiv:2012.15460"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19812-0_38"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2025.3601598"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/TITS.2025.3581391"},{"key":"ref25","article-title":"Spatial transformer networks","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Jaderberg"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00745"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1807.06521"},{"key":"ref28","article-title":"An image is worth 16\u00d716 words: Transformers for image recognition at scale","author":"Dosovitskiy","year":"2020","journal-title":"arXiv:2010.11929"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.474"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2011.155"},{"key":"ref32","article-title":"CrowdHuman: A benchmark for detecting human in a crowd","author":"Shao","year":"2018","journal-title":"arXiv:1805.00123"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2019.2929005"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1007\/s44267-024-00036-z"},{"key":"ref35","article-title":"MOT20: A benchmark for multi object 
tracking in crowded scenes","author":"Dendorfer","year":"2020","journal-title":"arXiv:2003.09003"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00644"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.324"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00978"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00972"},{"key":"ref40","first-page":"21002","article-title":"Generalized focal loss: Learning qualified and distributed bounding boxes for dense object detection","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Li"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00841"},{"key":"ref42","article-title":"YOLOX: Exceeding YOLO series in 2021","author":"Ge","year":"2021","journal-title":"arXiv:2107.08430"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2209.02976"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00721"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-72751-1_1"},{"key":"ref46","article-title":"RTMDet: An empirical study of designing real-time object detectors","author":"Lyu","year":"2022","journal-title":"arXiv:2212.07784"},{"key":"ref47","article-title":"DAB-DETR: Dynamic anchor boxes are better queries for DETR","author":"Liu","year":"2022","journal-title":"arXiv:2201.12329"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01325"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.00621"}],"container-title":["IEEE 
Access"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/6287639\/11323511\/11366873.pdf?arnumber=11366873","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,2,9]],"date-time":"2026-02-09T21:08:35Z","timestamp":1770671315000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11366873\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026]]},"references-count":49,"URL":"https:\/\/doi.org\/10.1109\/access.2026.3658620","relation":{},"ISSN":["2169-3536"],"issn-type":[{"value":"2169-3536","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026]]}}}