{"id":"https://openalex.org/W6891883924","doi":"https://doi.org/10.48550/arxiv.2507.21460","title":"An Angular-Temporal Interaction Network for Light Field Object Tracking in Low-Light Scenes","display_name":"An Angular-Temporal Interaction Network for Light Field Object Tracking in Low-Light Scenes","publication_year":2025,"publication_date":"2025-07-29","ids":{"openalex":"https://openalex.org/W6891883924","doi":"https://doi.org/10.48550/arxiv.2507.21460"},"language":"en","primary_location":{"id":"doi:10.48550/arxiv.2507.21460","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2507.21460","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2507.21460","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Wang, Mianzhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Wang, Mianzhao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Shi, Fan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shi, Fan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Cheng, Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cheng, Xu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Zhang, Feifei","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Feifei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Chen, Shengyong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Shengyong","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.5620999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.5620999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.1348000019788742,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.09860000014305115,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/light-field","display_name":"Light field","score":0.7631000280380249},{"id":"https://openalex.org/keywords/epipolar-geometry","display_name":"Epipolar geometry","score":0.7107999920845032},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.5249000191688538},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5134000182151794},{"id":"https://openalex.org/keywords/redundancy","display_name":"Redundancy (engineering)","score":0.47589999437332153},{"id":"https://openalex.org/keywords/video-tracking","display_name":"Video tracking","score":0.4672999978065491},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.46560001373291016},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.45339998602867126}],"concepts":[{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.7742000222206116},{"id":"https://openalex.org/C48983235","wikidata":"https://www.wikidata.org/wiki/Q593161","display_name":"Light field","level":2,"score":0.7631000280380249},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7555999755859375},{"id":"https://openalex.org/C23379248","wikidata":"https://www.wikidata.org/wiki/Q200904","display_name":"Epipolar geometry","level":3,"score":0.7107999920845032},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6169999837875366},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.5249000191688538},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5134000182151794},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.47589999437332153},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.4672999978065491},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.46560001373291016},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.45339998602867126},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.4047999978065491},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.40380001068115234},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.38530001044273376},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.3402999937534332},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.32170000672340393},{"id":"https://openalex.org/C108882727","wikidata":"https://www.wikidata.org/wiki/Q2991685","display_name":"Solid modeling","level":2,"score":0.3034000098705292},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.289000004529953},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2831000089645386},{"id":"https://openalex.org/C193581530","wikidata":"https://www.wikidata.org/wiki/Q683778","display_name":"Structured light","level":2,"score":0.2761000096797943},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.26080000400543213},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.25999999046325684},{"id":"https://openalex.org/C3020368824","wikidata":"https://www.wikidata.org/wiki/Q6546192","display_name":"Light intensity","level":2,"score":0.25529998540878296}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2507.21460","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2507.21460","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2507.21460","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2507.21460","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10","score":0.7815021276473999}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"High-quality":[0],"4D":[1],"light":[2,52,67,79,99,110,128,155,191],"field":[3,53,111,156,192],"representation":[4,58,86],"with":[5],"efficient":[6],"angular":[7,34],"feature":[8,144],"modeling":[9,35],"is":[10],"crucial":[11],"for":[12,109,159],"scene":[13],"perception,":[14],"as":[15],"it":[16],"can":[17,87,132],"provide":[18],"discriminative":[19],"spatial-angular":[20],"cues":[21,122,126],"to":[22,31,140,180],"identify":[23],"moving":[24],"targets.":[25],"However,":[26],"recent":[27],"developments":[28],"still":[29],"struggle":[30],"deliver":[32],"reliable":[33],"in":[36,41,75,91,97,136,170],"the":[37,62,66,72,76,82,119,142,147,177,187],"temporal":[38,148],"domain,":[39],"particularly":[40],"complex":[42],"low-light":[43,92,157],"scenes.":[44],"In":[45],"this":[46,85],"paper,":[47],"we":[48,151,175],"propose":[49,103],"a":[50,137,153],"novel":[51],"epipolar-plane":[54],"structure":[55,64],"image":[56],"(ESI)":[57],"that":[59,114,165],"explicitly":[60],"defines":[61],"geometric":[63,120,143],"within":[65,81],"field.":[68],"By":[69],"capitalizing":[70],"on":[71],"abrupt":[73],"changes":[74],"angles":[77],"of":[78,127,189],"rays":[80],"epipolar":[83],"plane,":[84],"enhance":[88,141],"visual":[89],"expression":[90],"scenes":[93],"and":[94,123],"reduce":[95],"redundancy":[96],"high-dimensional":[98],"fields.":[100,129],"We":[101],"further":[102],"an":[104],"angular-temporal":[105,124,193],"interaction":[106,125,145],"network":[107],"(ATINet)":[108],"object":[112,160,172,182],"tracking":[113],"learns":[115],"angular-aware":[116],"representations":[117],"from":[118],"structural":[121],"Furthermore,":[130,174],"ATINet":[131,166],"also":[133,185],"be":[134],"optimized":[135],"self-supervised":[138],"manner":[139],"across":[146],"domain.":[149],"Finally,":[150],"introduce":[152],"large-scale":[154],"dataset":[158],"tracking.":[161,173],"Extensive":[162],"experimentation":[163],"demonstrates":[164],"achieves":[167],"state-of-the-art":[168],"performance":[169],"single":[171],"extend":[176],"proposed":[178],"method":[179],"multiple":[181],"tracking,":[183],"which":[184],"shows":[186],"effectiveness":[188],"high-quality":[190],"modeling.":[194]},"counts_by_year":[],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-10T00:00:00"}
