{"id":"https://openalex.org/W4405710118","doi":"https://doi.org/10.1109/iscslp63861.2024.10800749","title":"StreamAAD: Decoding Spatial Auditory Attention with a Streaming Architecture","display_name":"StreamAAD: Decoding Spatial Auditory Attention with a Streaming Architecture","publication_year":2024,"publication_date":"2024-11-07","ids":{"openalex":"https://openalex.org/W4405710118","doi":"https://doi.org/10.1109/iscslp63861.2024.10800749"},"language":"en","primary_location":{"id":"doi:10.1109/iscslp63861.2024.10800749","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iscslp63861.2024.10800749","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE 14th International Symposium on Chinese Spoken Language Processing (ISCSLP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5036345679","display_name":"Zelin Qiu","orcid":"https://orcid.org/0000-0002-8952-2328"},"institutions":[{"id":"https://openalex.org/I4210099069","display_name":"Institute of Acoustics","ror":"https://ror.org/00v8rqv75","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210099069"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zelin Qiu","raw_affiliation_strings":["Institute of Acoustics, Chinese Academy of Sciences"],"affiliations":[{"raw_affiliation_string":"Institute of Acoustics, Chinese Academy of Sciences","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102802382","display_name":"Dingding Yao","orcid":"https://orcid.org/0000-0002-9610-8782"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210099069","display_name":"Institute of Acoustics","ror":"https://ror.org/00v8rqv75","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210099069"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dingding Yao","raw_affiliation_strings":["Institute of Acoustics, Chinese Academy of Sciences"],"affiliations":[{"raw_affiliation_string":"Institute of Acoustics, Chinese Academy of Sciences","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100450054","display_name":"Junfeng Li","orcid":"https://orcid.org/0000-0002-4841-4574"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210099069","display_name":"Institute of Acoustics","ror":"https://ror.org/00v8rqv75","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210099069"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Junfeng Li","raw_affiliation_strings":["Institute of Acoustics, Chinese Academy of Sciences"],"affiliations":[{"raw_affiliation_string":"Institute of Acoustics, Chinese Academy of Sciences","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5036345679"],"corresponding_institution_ids":["https://openalex.org/I19820366","https://openalex.org/I4210099069"],"apc_list":null,"apc_paid":null,"fwci":0.7257,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.71988796,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.968500018119812,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.968500018119812,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10914","display_name":"Tactile and Sensory Interactions","score":0.95660001039505,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12032","display_name":"Multisensory perception and integration","score":0.9366000294685364,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.8531316518783569},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7977395057678223},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.5879849195480347},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4585977792739868},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.18936967849731445},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.06505191326141357}],"concepts":[{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.8531316518783569},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7977395057678223},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.5879849195480347},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4585977792739868},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.18936967849731445},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.06505191326141357},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iscslp63861.2024.10800749","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iscslp63861.2024.10800749","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE 14th International Symposium on Chinese Spoken Language Processing (ISCSLP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Sustainable cities and communities","id":"https://metadata.un.org/sdg/11","score":0.699999988079071}],"awards":[{"id":"https://openalex.org/G8717273534","display_name":null,"funder_award_id":"12104483","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W1857789879","https://openalex.org/W1991139021","https://openalex.org/W2064675550","https://openalex.org/W2158904676","https://openalex.org/W2789758093","https://openalex.org/W2990116258","https://openalex.org/W3003432884","https://openalex.org/W3093647835","https://openalex.org/W3126966983","https://openalex.org/W3159696612","https://openalex.org/W4206654584","https://openalex.org/W4301367357","https://openalex.org/W4391160633","https://openalex.org/W4392903877","https://openalex.org/W4401023906","https://openalex.org/W6637242042","https://openalex.org/W6789284391","https://openalex.org/W6947496921"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"In":[0,68],"this":[1,57],"paper,":[2],"we":[3,59,93],"present":[4],"our":[5],"approach":[6],"for":[7,86],"the":[8,12,75,87,104,109],"Track":[9],"1":[10],"of":[11,89],"Chinese":[13],"Auditory":[14],"Attention":[15],"Decoding":[16],"(Chinese":[17],"AAD)":[18],"Challenge":[19],"at":[20],"ISCSLP":[21],"2024.":[22],"Most":[23],"existing":[24],"spatial":[25],"auditory":[26],"attention":[27],"decoding":[28,64],"(Sp-AAD)":[29],"methods":[30],"employ":[31,94],"an":[32],"isolated":[33],"window":[34],"architecture,":[35,65],"focusing":[36],"solely":[37],"on":[38],"global":[39],"invariant":[40],"features":[41],"without":[42],"considering":[43],"relationships":[44],"between":[45],"different":[46],"decision":[47,70],"windows,":[48],"which":[49],"can":[50],"lead":[51],"to":[52,74],"suboptimal":[53],"performance.":[54],"To":[55],"address":[56],"issue,":[58],"propose":[60],"a":[61,78,95],"novel":[62],"streaming":[63],"termed":[66],"StreamAAD.":[67],"StreamAAD,":[69],"windows":[71],"are":[72],"input":[73],"network":[76],"as":[77],"sequential":[79],"stream":[80],"and":[81],"decoded":[82],"in":[83,108],"order,":[84],"allowing":[85],"modeling":[88],"inter-window":[90],"relationships.":[91],"Additionally,":[92],"model":[96],"ensemble":[97],"strategy,":[98],"achieving":[99],"significant":[100],"better":[101],"performance":[102],"than":[103],"baseline,":[105],"ranking":[106],"First":[107],"challenge.":[110]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-13T16:22:10.518609","created_date":"2025-10-10T00:00:00"}
