{"id":"https://openalex.org/W7151245152","doi":"https://doi.org/10.48550/arxiv.2604.03592","title":"Unveiling Language Routing Isolation in Multilingual MoE Models for Interpretable Subnetwork Adaptation","display_name":"Unveiling Language Routing Isolation in Multilingual MoE Models for Interpretable Subnetwork Adaptation","publication_year":2026,"publication_date":"2026-04-04","ids":{"openalex":"https://openalex.org/W7151245152","doi":"https://doi.org/10.48550/arxiv.2604.03592"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.03592","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.03592","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.03592","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5133110190","display_name":"Kening Zheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zheng, Kening","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133102673","display_name":"Wei-Chieh Huang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Wei-Chieh","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133126420","display_name":"Jiahao Huo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huo, Jiahao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133124690","display_name":"Zhonghao Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Zhonghao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133143964","display_name":"Henry Peng Zou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zou, Henry Peng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133131093","display_name":"Yibo Yan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yan, Yibo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133102762","display_name":"Xin Zou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zou, Xin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129930813","display_name":"Jungang Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Jungang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133069076","display_name":"Junzhuo Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Junzhuo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133105521","display_name":"Hanrong Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Hanrong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133075729","display_name":"Xuming Hu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Xuming","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133143738","display_name":"Philip S. Yu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu, Philip S.","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":12,"corresponding_author_ids":["https://openalex.org/A5133110190"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.34360000491142273,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.34360000491142273,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.08889999985694885,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.051500000059604645,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/subnetwork","display_name":"Subnetwork","score":0.9745000004768372},{"id":"https://openalex.org/keywords/routing","display_name":"Routing (electronic design automation)","score":0.6581000089645386},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.604200005531311},{"id":"https://openalex.org/keywords/disjoint-sets","display_name":"Disjoint sets","score":0.5788999795913696},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.5442000031471252},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.489300012588501},{"id":"https://openalex.org/keywords/isolation","display_name":"Isolation (microbiology)","score":0.4681999981403351}],"concepts":[{"id":"https://openalex.org/C2780186347","wikidata":"https://www.wikidata.org/wiki/Q11414","display_name":"Subnetwork","level":2,"score":0.9745000004768372},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6934000253677368},{"id":"https://openalex.org/C74172769","wikidata":"https://www.wikidata.org/wiki/Q1446839","display_name":"Routing (electronic design automation)","level":2,"score":0.6581000089645386},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.604200005531311},{"id":"https://openalex.org/C45340560","wikidata":"https://www.wikidata.org/wiki/Q215382","display_name":"Disjoint sets","level":2,"score":0.5788999795913696},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.5442000031471252},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.489300012588501},{"id":"https://openalex.org/C2775941552","wikidata":"https://www.wikidata.org/wiki/Q25212305","display_name":"Isolation (microbiology)","level":2,"score":0.4681999981403351},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4571000039577484},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4009999930858612},{"id":"https://openalex.org/C24856439","wikidata":"https://www.wikidata.org/wiki/Q352483","display_name":"Adaptive routing","level":5,"score":0.3846000134944916},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.37880000472068787},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.36649999022483826},{"id":"https://openalex.org/C93959086","wikidata":"https://www.wikidata.org/wiki/Q6888345","display_name":"Model selection","level":2,"score":0.2980000078678131},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.2775999903678894},{"id":"https://openalex.org/C50335755","wikidata":"https://www.wikidata.org/wiki/Q483247","display_name":"Phenomenon","level":2,"score":0.26930001378059387},{"id":"https://openalex.org/C204948658","wikidata":"https://www.wikidata.org/wiki/Q1119410","display_name":"Static routing","level":4,"score":0.2687999904155731}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.03592","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.03592","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.03592","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.03592","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Mixture-of-Experts":[0],"(MoE)":[1],"models":[2],"exhibit":[3,64],"striking":[4],"performance":[5,140],"disparities":[6],"across":[7,69],"languages,":[8],"yet":[9],"the":[10,127],"internal":[11],"mechanisms":[12],"driving":[13],"these":[14,74],"gaps":[15],"remain":[16],"poorly":[17],"understood.":[18],"In":[19],"this":[20],"work,":[21],"we":[22,37,58,76],"conduct":[23],"a":[24,35,65,83,98],"systematic":[25],"analysis":[26],"of":[27,158],"expert":[28,53,94],"routing":[29,62,87],"patterns":[30,63],"in":[31,42,109,121,144],"MoE":[32],"models,":[33],"revealing":[34],"phenomenon":[36],"term":[38],"Language":[39],"Routing":[40],"Isolation,":[41],"which":[43],"high-":[44],"and":[45,91,111,114],"low-resource":[46,138],"languages":[47,150],"tend":[48],"to":[49,89,105,117,160],"activate":[50],"largely":[51],"disjoint":[52],"sets.":[54],"Through":[55],"layer-stratified":[56],"analysis,":[57],"further":[59],"show":[60],"that":[61,85,152],"layer-wise":[66],"convergence-divergence":[67],"pattern":[68],"model":[70],"depth.":[71],"Building":[72],"on":[73,148],"findings,":[75],"propose":[77],"RISE":[78,96,135,153],"(Routing":[79],"Isolation-guided":[80],"Subnetwork":[81],"Enhancement),":[82],"framework":[84],"exploits":[86],"isolation":[88],"identify":[90,106],"adapt":[92],"language-specific":[93,107],"subnetworks.":[95],"applies":[97],"tripartite":[99],"selection":[100],"strategy,":[101],"using":[102],"specificity":[103],"scores":[104,116],"experts":[108,120],"shallow":[110],"deep":[112],"layers":[113],"overlap":[115],"select":[118],"universal":[119],"middle":[122],"layers.":[123],"By":[124],"training":[125],"only":[126],"selected":[128],"subnetwork":[129],"while":[130,141],"freezing":[131],"all":[132],"other":[133,145],"parameters,":[134],"substantially":[136],"improves":[137],"language":[139],"preserving":[142],"capabilities":[143],"languages.":[146],"Experiments":[147],"10":[149],"demonstrate":[151],"achieves":[154],"target-language":[155],"F1":[156],"gains":[157],"up":[159],"10.85%":[161],"with":[162],"minimal":[163],"cross-lingual":[164],"degradation.":[165]},"counts_by_year":[],"updated_date":"2026-04-08T06:07:18.267832","created_date":"2026-04-08T00:00:00"}
