{"id":"https://openalex.org/W2798338993","doi":"https://doi.org/10.1109/cvpr.2018.00743","title":"A Face-to-Face Neural Conversation Model","display_name":"A Face-to-Face Neural Conversation Model","publication_year":2018,"publication_date":"2018-06-01","ids":{"openalex":"https://openalex.org/W2798338993","doi":"https://doi.org/10.1109/cvpr.2018.00743","mag":"2798338993"},"language":"en","primary_location":{"id":"doi:10.1109/cvpr.2018.00743","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr.2018.00743","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 IEEE/CVF Conference on Computer Vision and Pattern Recognition","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102303167","display_name":"Hang Chu","orcid":null},"institutions":[{"id":"https://openalex.org/I185261750","display_name":"University of Toronto","ror":"https://ror.org/03dbr7087","country_code":"CA","type":"education","lineage":["https://openalex.org/I185261750"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"Hang Chu","raw_affiliation_strings":["University of Toronto"],"affiliations":[{"raw_affiliation_string":"University of Toronto","institution_ids":["https://openalex.org/I185261750"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038967947","display_name":"Daiqing Li","orcid":"https://orcid.org/0000-0001-5814-0872"},"institutions":[{"id":"https://openalex.org/I185261750","display_name":"University of Toronto","ror":"https://ror.org/03dbr7087","country_code":"CA","type":"education","lineage":["https://openalex.org/I185261750"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Daiqing Li","raw_affiliation_strings":["University of Toronto"],"affiliations":[{"raw_affiliation_string":"University of Toronto","institution_ids":["https://openalex.org/I185261750"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5070642269","display_name":"Sanja Fidler","orcid":"https://orcid.org/0000-0003-1040-3260"},"institutions":[{"id":"https://openalex.org/I185261750","display_name":"University of Toronto","ror":"https://ror.org/03dbr7087","country_code":"CA","type":"education","lineage":["https://openalex.org/I185261750"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Sanja Fidler","raw_affiliation_strings":["University of Toronto"],"affiliations":[{"raw_affiliation_string":"University of Toronto","institution_ids":["https://openalex.org/I185261750"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5102303167"],"corresponding_institution_ids":["https://openalex.org/I185261750"],"apc_list":null,"apc_paid":null,"fwci":1.149,"has_fulltext":false,"cited_by_count":16,"citation_normalized_percentile":{"value":0.83298024,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"7113","last_page":"7121"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/conversation","display_name":"Conversation","score":0.8609215021133423},{"id":"https://openalex.org/keywords/gesture","display_name":"Gesture","score":0.7852983474731445},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7621641159057617},{"id":"https://openalex.org/keywords/dialog-box","display_name":"Dialog box","score":0.704788327217102},{"id":"https://openalex.org/keywords/avatar","display_name":"Avatar","score":0.6176756620407104},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5841513872146606},{"id":"https://openalex.org/keywords/face","display_name":"Face (sociological concept)","score":0.5302597880363464},{"id":"https://openalex.org/keywords/natural","display_name":"Natural (archaeology)","score":0.48186764121055603},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.44935959577560425},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.4087325632572174},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3533807098865509},{"id":"https://openalex.org/keywords/communication","display_name":"Communication","score":0.2004176378250122},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.18289878964424133},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.18207687139511108}],"concepts":[{"id":"https://openalex.org/C2777200299","wikidata":"https://www.wikidata.org/wiki/Q52943","display_name":"Conversation","level":2,"score":0.8609215021133423},{"id":"https://openalex.org/C207347870","wikidata":"https://www.wikidata.org/wiki/Q371174","display_name":"Gesture","level":2,"score":0.7852983474731445},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7621641159057617},{"id":"https://openalex.org/C173853756","wikidata":"https://www.wikidata.org/wiki/Q86915","display_name":"Dialog box","level":2,"score":0.704788327217102},{"id":"https://openalex.org/C2777365542","wikidata":"https://www.wikidata.org/wiki/Q83090","display_name":"Avatar","level":2,"score":0.6176756620407104},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5841513872146606},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.5302597880363464},{"id":"https://openalex.org/C2776608160","wikidata":"https://www.wikidata.org/wiki/Q4785462","display_name":"Natural (archaeology)","level":2,"score":0.48186764121055603},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44935959577560425},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.4087325632572174},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3533807098865509},{"id":"https://openalex.org/C46312422","wikidata":"https://www.wikidata.org/wiki/Q11024","display_name":"Communication","level":1,"score":0.2004176378250122},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.18289878964424133},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.18207687139511108},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cvpr.2018.00743","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr.2018.00743","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 IEEE/CVF Conference on Computer Vision and Pattern Recognition","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","score":0.5199999809265137,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":46,"referenced_works":["https://openalex.org/W10957333","https://openalex.org/W1486649854","https://openalex.org/W1509031088","https://openalex.org/W1522301498","https://openalex.org/W1566289585","https://openalex.org/W1591706642","https://openalex.org/W2028422222","https://openalex.org/W2035046981","https://openalex.org/W2047508432","https://openalex.org/W2064675550","https://openalex.org/W2070353225","https://openalex.org/W2087064593","https://openalex.org/W2109606373","https://openalex.org/W2130942839","https://openalex.org/W2139196777","https://openalex.org/W2152826865","https://openalex.org/W2161466446","https://openalex.org/W2176263492","https://openalex.org/W2211242044","https://openalex.org/W2296371640","https://openalex.org/W2301937176","https://openalex.org/W2395639500","https://openalex.org/W2486034530","https://openalex.org/W2738406145","https://openalex.org/W2769375465","https://openalex.org/W2962883855","https://openalex.org/W2962968835","https://openalex.org/W2963084599","https://openalex.org/W2963167310","https://openalex.org/W2963206148","https://openalex.org/W2963248296","https://openalex.org/W2963488642","https://openalex.org/W2963542293","https://openalex.org/W2963790827","https://openalex.org/W2963890755","https://openalex.org/W2964121744","https://openalex.org/W2964268978","https://openalex.org/W2964352131","https://openalex.org/W3022187094","https://openalex.org/W4236521339","https://openalex.org/W6600426076","https://openalex.org/W6629028937","https://openalex.org/W6662335928","https://openalex.org/W6679436768","https://openalex.org/W6711957290","https://openalex.org/W6727862155"],"related_works":["https://openalex.org/W3138471234","https://openalex.org/W4247958311","https://openalex.org/W2098987383","https://openalex.org/W2417260800","https://openalex.org/W2795961259","https://openalex.org/W1596203174","https://openalex.org/W2117933979","https://openalex.org/W4298396513","https://openalex.org/W2283130723","https://openalex.org/W103938586"],"abstract_inverted_index":{"Neural":[0],"networks":[1],"have":[2],"recently":[3],"become":[4],"good":[5],"at":[6,90],"engaging":[7],"in":[8,104,133],"dialog.":[9],"However,":[10],"current":[11],"approaches":[12],"are":[13],"based":[14,52],"solely":[15],"on":[16,53],"verbal":[17,77,93],"text,":[18],"lacking":[19],"the":[20,54,57,68,76,86,92,100,105,109],"richness":[21],"of":[22,56,70,82],"a":[23,29,142,151],"real":[24],"face-to-face":[25,152],"conversation.":[26,58,78],"We":[27,116,127,145],"propose":[28],"neural":[30,119],"conversation":[31],"model":[32,47,132],"that":[33,66],"aims":[34,89],"to":[35,48],"read":[36],"and":[37,95,114,141],"generate":[38],"facial":[39,71,97],"gestures":[40],"alongside":[41],"with":[42,150],"text.":[43],"This":[44],"allows":[45],"our":[46,118,129],"adapt":[49],"its":[50],"response":[51,94],"\"mood\"":[55],"In":[59],"particular,":[60],"we":[61],"introduce":[62],"an":[63,147],"RNN":[64],"encoder-decoder":[65],"exploits":[67],"movement":[69],"muscles,":[72],"as":[73,75],"well":[74],"The":[79],"decoder":[80],"consists":[81],"two":[83],"layers,":[84],"where":[85],"lower":[87],"layer":[88,102],"generating":[91,134],"coarse":[96],"expressions,":[98],"while":[99],"second":[101],"fills":[103],"subtle":[106],"gestures,":[107],"making":[108],"generated":[110],"output":[111],"more":[112,135],"smooth":[113],"natural.":[115],"train":[117],"network":[120],"by":[121],"having":[122],"it":[123],"\"watch\"":[124],"250":[125],"movies.":[126],"showcase":[128],"joint":[130],"face-text":[131],"natural":[136],"conversations":[137],"through":[138],"automatic":[139],"metrics":[140],"human":[143],"study.":[144],"demonstrate":[146],"example":[148],"application":[149],"chatting":[153],"avatar.":[154]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":6}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
