{"id":"https://openalex.org/W3116628494","doi":"https://doi.org/10.18653/v1/2020.coling-tutorials.7","title":"Endangered Languages meet Modern NLP","display_name":"Endangered Languages meet Modern NLP","publication_year":2020,"publication_date":"2020-01-01","ids":{"openalex":"https://openalex.org/W3116628494","doi":"https://doi.org/10.18653/v1/2020.coling-tutorials.7","mag":"3116628494"},"language":"en","primary_location":{"id":"doi:10.18653/v1/2020.coling-tutorials.7","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2020.coling-tutorials.7","pdf_url":"https://www.aclweb.org/anthology/2020.coling-tutorials.7.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 28th International Conference on Computational Linguistics: Tutorial Abstracts","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.aclweb.org/anthology/2020.coling-tutorials.7.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013793053","display_name":"Antonios Anastasopoulos","orcid":"https://orcid.org/0000-0002-8544-246X"},"institutions":[{"id":"https://openalex.org/I162714631","display_name":"George Mason University","ror":"https://ror.org/02jqj7156","country_code":"US","type":"education","lineage":["https://openalex.org/I162714631"]},{"id":"https://openalex.org/I142740786","display_name":"University of Louisville","ror":"https://ror.org/01ckdn478","country_code":"US","type":"education","lineage":["https://openalex.org/I142740786"]},{"id":"https://openalex.org/I67031392","display_name":"Carleton University","ror":"https://ror.org/02qtvee93","country_code":"CA","type":"education","lineage":["https://openalex.org/I67031392"]},{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["CA","US"],"is_corresponding":true,"raw_author_name":"Antonios Anastasopoulos","raw_affiliation_strings":["School of Linguistics and Language Studies, Carleton University \u2663 Comparative Humanities, University of Louisville","Department of Computer Science, George Mason University \u2021 Language Technologies Institute, Carnegie Mellon University"],"affiliations":[{"raw_affiliation_string":"School of Linguistics and Language Studies, Carleton University \u2663 Comparative Humanities, University of Louisville","institution_ids":["https://openalex.org/I67031392","https://openalex.org/I142740786"]},{"raw_affiliation_string":"Department of Computer Science, George Mason University \u2021 Language Technologies Institute, Carnegie Mellon University","institution_ids":["https://openalex.org/I162714631","https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019908886","display_name":"Christopher Cox","orcid":"https://orcid.org/0009-0003-1264-9245"},"institutions":[{"id":"https://openalex.org/I162714631","display_name":"George Mason University","ror":"https://ror.org/02jqj7156","country_code":"US","type":"education","lineage":["https://openalex.org/I162714631"]},{"id":"https://openalex.org/I142740786","display_name":"University of Louisville","ror":"https://ror.org/01ckdn478","country_code":"US","type":"education","lineage":["https://openalex.org/I142740786"]},{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]},{"id":"https://openalex.org/I67031392","display_name":"Carleton University","ror":"https://ror.org/02qtvee93","country_code":"CA","type":"education","lineage":["https://openalex.org/I67031392"]}],"countries":["CA","US"],"is_corresponding":false,"raw_author_name":"Christopher Cox","raw_affiliation_strings":["Department of Computer Science, George Mason University \u2021 Language Technologies Institute, Carnegie Mellon University","School of Linguistics and Language Studies, Carleton University \u2663 Comparative Humanities, University of Louisville"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, George Mason University \u2021 Language Technologies Institute, Carnegie Mellon University","institution_ids":["https://openalex.org/I162714631","https://openalex.org/I74973139"]},{"raw_affiliation_string":"School of Linguistics and Language Studies, Carleton University \u2663 Comparative Humanities, University of Louisville","institution_ids":["https://openalex.org/I67031392","https://openalex.org/I142740786"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068811427","display_name":"Graham Neubig","orcid":"https://orcid.org/0000-0002-2072-3789"},"institutions":[{"id":"https://openalex.org/I162714631","display_name":"George Mason University","ror":"https://ror.org/02jqj7156","country_code":"US","type":"education","lineage":["https://openalex.org/I162714631"]},{"id":"https://openalex.org/I67031392","display_name":"Carleton University","ror":"https://ror.org/02qtvee93","country_code":"CA","type":"education","lineage":["https://openalex.org/I67031392"]},{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]},{"id":"https://openalex.org/I142740786","display_name":"University of Louisville","ror":"https://ror.org/01ckdn478","country_code":"US","type":"education","lineage":["https://openalex.org/I142740786"]}],"countries":["CA","US"],"is_corresponding":false,"raw_author_name":"Graham Neubig","raw_affiliation_strings":["Department of Computer Science, George Mason University \u2021 Language Technologies Institute, Carnegie Mellon University","School of Linguistics and Language Studies, Carleton University \u2663 Comparative Humanities, University of Louisville"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, George Mason University \u2021 Language Technologies Institute, Carnegie Mellon University","institution_ids":["https://openalex.org/I162714631","https://openalex.org/I74973139"]},{"raw_affiliation_string":"School of Linguistics and Language Studies, Carleton University \u2663 Comparative Humanities, University of Louisville","institution_ids":["https://openalex.org/I67031392","https://openalex.org/I142740786"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5000564128","display_name":"Hilaria Cruz","orcid":null},"institutions":[{"id":"https://openalex.org/I142740786","display_name":"University of Louisville","ror":"https://ror.org/01ckdn478","country_code":"US","type":"education","lineage":["https://openalex.org/I142740786"]},{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]},{"id":"https://openalex.org/I162714631","display_name":"George Mason University","ror":"https://ror.org/02jqj7156","country_code":"US","type":"education","lineage":["https://openalex.org/I162714631"]},{"id":"https://openalex.org/I67031392","display_name":"Carleton University","ror":"https://ror.org/02qtvee93","country_code":"CA","type":"education","lineage":["https://openalex.org/I67031392"]}],"countries":["CA","US"],"is_corresponding":false,"raw_author_name":"Hilaria Cruz","raw_affiliation_strings":["Department of Computer Science, George Mason University \u2021 Language Technologies Institute, Carnegie Mellon University","School of Linguistics and Language Studies, Carleton University \u2663 Comparative Humanities, University of Louisville"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, George Mason University \u2021 Language Technologies Institute, Carnegie Mellon University","institution_ids":["https://openalex.org/I162714631","https://openalex.org/I74973139"]},{"raw_affiliation_string":"School of Linguistics and Language Studies, Carleton University \u2663 Comparative Humanities, University of Louisville","institution_ids":["https://openalex.org/I67031392","https://openalex.org/I142740786"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5013793053"],"corresponding_institution_ids":["https://openalex.org/I142740786","https://openalex.org/I162714631","https://openalex.org/I67031392","https://openalex.org/I74973139"],"apc_list":null,"apc_paid":null,"fwci":0.7954,"has_fulltext":true,"cited_by_count":7,"citation_normalized_percentile":{"value":0.79166887,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"39","last_page":"45"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9853000044822693,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7202948331832886},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6708608269691467},{"id":"https://openalex.org/keywords/endangered-species","display_name":"Endangered species","score":0.6630834937095642},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5956816077232361},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.10961386561393738},{"id":"https://openalex.org/keywords/ecology","display_name":"Ecology","score":0.04892072081565857}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7202948331832886},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6708608269691467},{"id":"https://openalex.org/C179345059","wikidata":"https://www.wikidata.org/wiki/Q11394","display_name":"Endangered species","level":3,"score":0.6630834937095642},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5956816077232361},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.10961386561393738},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.04892072081565857},{"id":"https://openalex.org/C185933670","wikidata":"https://www.wikidata.org/wiki/Q52105","display_name":"Habitat","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/2020.coling-tutorials.7","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2020.coling-tutorials.7","pdf_url":"https://www.aclweb.org/anthology/2020.coling-tutorials.7.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 28th International Conference on Computational Linguistics: Tutorial Abstracts","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/2020.coling-tutorials.7","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2020.coling-tutorials.7","pdf_url":"https://www.aclweb.org/anthology/2020.coling-tutorials.7.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 28th International Conference on Computational Linguistics: Tutorial Abstracts","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.8399999737739563,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320310207","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33"},{"id":"https://openalex.org/F4320310249","display_name":"Carleton University","ror":"https://ror.org/02qtvee93"},{"id":"https://openalex.org/F4320310260","display_name":"University of Notre Dame","ror":"https://ror.org/00mkhxb43"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3116628494.pdf","grobid_xml":"https://content.openalex.org/works/W3116628494.grobid-xml"},"referenced_works_count":31,"referenced_works":["https://openalex.org/W1964331935","https://openalex.org/W2014840417","https://openalex.org/W2091746061","https://openalex.org/W2251408482","https://openalex.org/W2345799635","https://openalex.org/W2585654394","https://openalex.org/W2740382200","https://openalex.org/W2763898218","https://openalex.org/W2807710978","https://openalex.org/W2823189734","https://openalex.org/W2883972335","https://openalex.org/W2895097770","https://openalex.org/W2901616036","https://openalex.org/W2937657581","https://openalex.org/W2942683110","https://openalex.org/W2962712594","https://openalex.org/W2962899008","https://openalex.org/W2963014409","https://openalex.org/W2963091326","https://openalex.org/W2963826397","https://openalex.org/W2968525655","https://openalex.org/W2969530280","https://openalex.org/W2970913210","https://openalex.org/W2970963828","https://openalex.org/W2971882750","https://openalex.org/W2978709484","https://openalex.org/W3100160869","https://openalex.org/W4229891088","https://openalex.org/W4238795374","https://openalex.org/W4298876202","https://openalex.org/W4365799947"],"related_works":["https://openalex.org/W2151447942","https://openalex.org/W2611614995","https://openalex.org/W2368651715","https://openalex.org/W2789919619","https://openalex.org/W3107474891","https://openalex.org/W1552159754","https://openalex.org/W2148757832","https://openalex.org/W2293457016","https://openalex.org/W1870336386","https://openalex.org/W3169305685"],"abstract_inverted_index":{"This":[0],"tutorial":[1],"will":[2,14,45,71],"focus":[3],"on":[4,83],"NLP":[5,42,51,92,101],"for":[6],"endangered":[7],"languages":[8],"documentation":[9],"and":[10,21,35,81,87,110,117],"revitalization.":[11],"First,":[12],"we":[13,70],"acquaint":[15],"the":[16,19,22,29,32,36,48,74,85,88,115,120],"attendees":[17],"with":[18,114],"process":[20],"challenges":[23,75],"of":[24,31,76,90,119,123],"language":[25,33],"documentation,":[26],"showing":[27],"how":[28],"needs":[30],"communities":[34],"documentary":[37],"linguists":[38],"map":[39],"to":[40,98,103,129],"specific":[41],"tasks.":[43],"We":[44],"then":[46],"present":[47],"state-of-the-art":[49],"in":[50,53,78,127],"applied":[52],"this":[54,79,106],"particularly":[55],"challenging":[56],"setting":[57],"(extremely":[58],"low-resource":[59],"datasets,":[60],"noisy":[61],"transcriptions,":[62],"limited":[63],"annotations,":[64],"non-standard":[65],"orthographies).":[66],"In":[67],"doing":[68],"so,":[69],"also":[72,111],"analyze":[73],"working":[77],"domain":[80],"expand":[82],"both":[84,122],"capabilities":[86],"limitations":[89],"current":[91],"approaches.":[93],"Our":[94],"ultimate":[95],"goal":[96],"is":[97],"motivate":[99],"more":[100],"practitioners":[102],"work":[104],"towards":[105],"very":[107],"important":[108],"direction,":[109],"provide":[112],"them":[113],"tools":[116],"understanding":[118],"limitations/challenges,":[121],"which":[124],"are":[125],"needed":[126],"order":[128],"have":[130],"an":[131],"impact.":[132]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":5}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
