{"id":"https://openalex.org/W4409366542","doi":"https://doi.org/10.1609/aaai.v39i7.32773","title":"Modality-Aware Shot Relating and Comparing for Video Scene Detection","display_name":"Modality-Aware Shot Relating and Comparing for Video Scene Detection","publication_year":2025,"publication_date":"2025-04-11","ids":{"openalex":"https://openalex.org/W4409366542","doi":"https://doi.org/10.1609/aaai.v39i7.32773"},"language":"en","primary_location":{"id":"doi:10.1609/aaai.v39i7.32773","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v39i7.32773","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/32773/34928","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://ojs.aaai.org/index.php/AAAI/article/download/32773/34928","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053386671","display_name":"Jiawei Tan","orcid":"https://orcid.org/0000-0003-3299-0785"},"institutions":[{"id":"https://openalex.org/I4210094876","display_name":"Ministry of Education","ror":"https://ror.org/00q919b81","country_code":"SA","type":"government","lineage":["https://openalex.org/I4210094876"]}],"countries":["SA"],"is_corresponding":true,"raw_author_name":"Jiawei Tan","raw_affiliation_strings":["Key Laboratory of Dependable Service Computing in Cyber Physical Society (Chongqing University), Ministry of Education, China\nSchool of Big Data and Software Engineering, Chongqing University, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Dependable Service Computing in Cyber Physical Society (Chongqing University), Ministry of Education, China\nSchool of Big Data and Software Engineering, Chongqing University, China","institution_ids":["https://openalex.org/I4210094876"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115596036","display_name":"Hongxing Wang","orcid":"https://orcid.org/0009-0000-9803-7503"},"institutions":[{"id":"https://openalex.org/I4210094876","display_name":"Ministry of Education","ror":"https://ror.org/00q919b81","country_code":"SA","type":"government","lineage":["https://openalex.org/I4210094876"]}],"countries":["SA"],"is_corresponding":false,"raw_author_name":"Hongxing Wang","raw_affiliation_strings":["Key Laboratory of Dependable Service Computing in Cyber Physical Society (Chongqing University), Ministry of Education, China\nSchool of Big Data and Software Engineering, Chongqing University, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Dependable Service Computing in Cyber Physical Society (Chongqing University), Ministry of Education, China\nSchool of Big Data and Software Engineering, Chongqing University, China","institution_ids":["https://openalex.org/I4210094876"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101105741","display_name":"Kang Dang","orcid":"https://orcid.org/0000-0003-0613-2787"},"institutions":[{"id":"https://openalex.org/I69356397","display_name":"Xi\u2019an Jiaotong-Liverpool University","ror":"https://ror.org/03zmrmn05","country_code":"CN","type":"education","lineage":["https://openalex.org/I69356397"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kang Dang","raw_affiliation_strings":["School of AI and Advanced Computing, XJTLU Entrepreneur College (Taicang), Xi\u2019an Jiaotong-Liverpool University, Suzhou, China"],"affiliations":[{"raw_affiliation_string":"School of AI and Advanced Computing, XJTLU Entrepreneur College (Taicang), Xi\u2019an Jiaotong-Liverpool University, Suzhou, China","institution_ids":["https://openalex.org/I69356397"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010619966","display_name":"Jiaxin Li","orcid":"https://orcid.org/0000-0003-2251-8815"},"institutions":[{"id":"https://openalex.org/I4210094876","display_name":"Ministry of Education","ror":"https://ror.org/00q919b81","country_code":"SA","type":"government","lineage":["https://openalex.org/I4210094876"]}],"countries":["SA"],"is_corresponding":false,"raw_author_name":"Jiaxin Li","raw_affiliation_strings":["Key Laboratory of Dependable Service Computing in Cyber Physical Society (Chongqing University), Ministry of Education, China\nSchool of Big Data and Software Engineering, Chongqing University, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Dependable Service Computing in Cyber Physical Society (Chongqing University), Ministry of Education, China\nSchool of Big Data and Software Engineering, Chongqing University, China","institution_ids":["https://openalex.org/I4210094876"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5061500807","display_name":"Zhilong Ou","orcid":"https://orcid.org/0000-0002-8587-1854"},"institutions":[{"id":"https://openalex.org/I4210094876","display_name":"Ministry of Education","ror":"https://ror.org/00q919b81","country_code":"SA","type":"government","lineage":["https://openalex.org/I4210094876"]}],"countries":["SA"],"is_corresponding":false,"raw_author_name":"Zhilong Ou","raw_affiliation_strings":["Key Laboratory of Dependable Service Computing in Cyber Physical Society (Chongqing University), Ministry of Education, China\nSchool of Big Data and Software Engineering, Chongqing University, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Dependable Service Computing in Cyber Physical Society (Chongqing University), Ministry of Education, China\nSchool of Big Data and Software Engineering, Chongqing University, China","institution_ids":["https://openalex.org/I4210094876"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5053386671"],"corresponding_institution_ids":["https://openalex.org/I4210094876"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.18237454,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"39","issue":"7","first_page":"7193","last_page":"7201"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12357","display_name":"Digital Media Forensic Detection","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.8100745677947998},{"id":"https://openalex.org/keywords/shot","display_name":"Shot (pellet)","score":0.803001880645752},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5395148992538452},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.5137942433357239},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.45182156562805176}],"concepts":[{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.8100745677947998},{"id":"https://openalex.org/C2778344882","wikidata":"https://www.wikidata.org/wiki/Q278938","display_name":"Shot (pellet)","level":2,"score":0.803001880645752},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5395148992538452},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5137942433357239},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.45182156562805176},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1609/aaai.v39i7.32773","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v39i7.32773","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/32773/34928","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1609/aaai.v39i7.32773","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v39i7.32773","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/32773/34928","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G316265475","display_name":null,"funder_award_id":"61976029","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4409366542.pdf","grobid_xml":"https://content.openalex.org/works/W4409366542.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2772917594","https://openalex.org/W2036807459","https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"Video":[0],"scene":[1,98,182,211],"detection":[2,61],"involves":[3],"assessing":[4],"whether":[5],"each":[6,36,171],"shot":[7,116,121,130,142,158,173],"and":[8,26,31,45,72,87,111,149,167],"its":[9],"surroundings":[10],"belong":[11],"to":[12,59,96,103],"the":[13,52,68,106,163,179,187,191,205],"same":[14],"scene.":[15],"Achieving":[16],"this":[17,64,136],"requires":[18],"meticulously":[19],"correlating":[20],"multi-modal":[21,42],"cues,":[22],"e.g.,":[23],"visual":[24,85,109],"entity":[25,86,110,124],"place":[27,88,112,133],"modalities,":[28,89],"among":[29],"shots":[30,79,169],"comparing":[32,93],"semantic":[33],"changes":[34,99],"around":[35],"shot.":[37],"However,":[38],"most":[39],"methods":[40],"treat":[41],"semantics":[43,125],"equally":[44],"do":[46],"not":[47],"examine":[48],"contextual":[49],"differences":[50],"between":[51,165],"two":[53],"sides":[54],"of":[55,84,108,170,181,190],"a":[56],"shot,":[57],"leading":[58],"sub-optimal":[60],"performance.":[62],"In":[63,135],"paper,":[65],"we":[66,118,138,160],"propose":[67],"Modality-Aware":[69],"Shot":[70],"Relating":[71],"Comparing":[73],"approach":[74],"(MASRC),":[75],"which":[76],"enables":[77],"relating":[78],"per":[80],"their":[81],"own":[82],"characteristics":[83],"as":[90,92],"well":[91],"multi-shots":[94],"similarities":[95],"have":[97],"explicitly":[100],"encoded.":[101],"Specifically,":[102],"fully":[104],"harness":[105],"potential":[107],"modalities":[113],"in":[114,178,194],"modeling":[115],"relations,":[117],"mine":[119],"long-term":[120],"correlations":[122,131],"from":[123,132],"while":[126],"simultaneously":[127],"revealing":[128],"short-term":[129],"semantics.":[134],"way,":[137],"can":[139],"learn":[140],"distinctive":[141,157],"features":[143],"that":[144,204],"consolidate":[145],"coherence":[146],"within":[147],"scenes":[148],"amplify":[150],"distinguishability":[151],"across":[152],"scenes.":[153],"Once":[154],"equipped":[155],"with":[156],"features,":[159],"further":[161],"encode":[162],"relations":[164],"preceding":[166],"succeeding":[168],"target":[172],"by":[174],"similarity":[175],"convolution,":[176],"aiding":[177],"identification":[180],"ending":[183],"shots.":[184],"We":[185],"validate":[186],"broad":[188],"applicability":[189],"proposed":[192,206],"components":[193],"MASRC.":[195],"Extensive":[196],"experimental":[197],"results":[198],"on":[199],"public":[200],"benchmark":[201],"datasets":[202],"demonstrate":[203],"MASRC":[207],"significantly":[208],"advances":[209],"video":[210],"detection.":[212]},"counts_by_year":[],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-10-10T00:00:00"}
