{"id":"https://openalex.org/W4280579537","doi":"https://doi.org/10.48550/arxiv.2205.09073","title":"Dialog Inpainting: Turning Documents into Dialogs","display_name":"Dialog Inpainting: Turning Documents into Dialogs","publication_year":2022,"publication_date":"2022-05-18","ids":{"openalex":"https://openalex.org/W4280579537","doi":"https://doi.org/10.48550/arxiv.2205.09073"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2205.09073","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2205.09073","pdf_url":"https://arxiv.org/pdf/2205.09073","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2205.09073","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5062633736","display_name":"Zhuyun Dai","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Dai, Zhuyun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024150057","display_name":"Arun Tejasvi Chaganty","orcid":"https://orcid.org/0000-0001-7122-1298"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chaganty, Arun Tejasvi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016423432","display_name":"Vincent Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Vincent","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034305203","display_name":"Aida Amini","orcid":"https://orcid.org/0000-0002-0576-5147"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Amini, Aida","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020446219","display_name":"Qazi Mamunur Rashid","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rashid, Qazi Mamunur","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029111089","display_name":"Mike Green","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Green, Mike","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5076669462","display_name":"Kelvin Guu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guu, Kelvin","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5062633736"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":17,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/dialog-box","display_name":"Dialog box","score":0.9675024747848511},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.790404736995697},{"id":"https://openalex.org/keywords/conversation","display_name":"Conversation","score":0.7690465450286865},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.6368334293365479},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6192212104797363},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5267966389656067},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5087304711341858},{"id":"https://openalex.org/keywords/utterance","display_name":"Utterance","score":0.47002124786376953},{"id":"https://openalex.org/keywords/dialog-system","display_name":"Dialog system","score":0.4582814574241638},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.4165574312210083},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.41210219264030457},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.22727951407432556},{"id":"https://openalex.org/keywords/history","display_name":"History","score":0.08541795611381531}],"concepts":[{"id":"https://openalex.org/C173853756","wikidata":"https://www.wikidata.org/wiki/Q86915","display_name":"Dialog box","level":2,"score":0.9675024747848511},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.790404736995697},{"id":"https://openalex.org/C2777200299","wikidata":"https://www.wikidata.org/wiki/Q52943","display_name":"Conversation","level":2,"score":0.7690465450286865},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6368334293365479},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6192212104797363},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5267966389656067},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5087304711341858},{"id":"https://openalex.org/C2775852435","wikidata":"https://www.wikidata.org/wiki/Q258403","display_name":"Utterance","level":2,"score":0.47002124786376953},{"id":"https://openalex.org/C190954187","wikidata":"https://www.wikidata.org/wiki/Q5270587","display_name":"Dialog system","level":3,"score":0.4582814574241638},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.4165574312210083},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.41210219264030457},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.22727951407432556},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.08541795611381531},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2205.09073","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2205.09073","pdf_url":"https://arxiv.org/pdf/2205.09073","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2205.09073","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2205.09073","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2205.09073","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2205.09073","pdf_url":"https://arxiv.org/pdf/2205.09073","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.6899999976158142,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2500779211","https://openalex.org/W48079147","https://openalex.org/W3133700904","https://openalex.org/W1963944933","https://openalex.org/W2563921006","https://openalex.org/W1600043506","https://openalex.org/W2097043665","https://openalex.org/W2013809956","https://openalex.org/W2063157598","https://openalex.org/W2107559347"],"abstract_inverted_index":{"Many":[0],"important":[1],"questions":[2],"(e.g.":[3],"\"How":[4],"to":[5,10,34,95,115,155,169,187],"eat":[6],"healthier?\")":[7],"require":[8],"conversation":[9],"establish":[11],"context":[12],"and":[13,49,63,73,89,119,125,151],"explore":[14],"in":[15,104],"depth.":[16],"However,":[17],"conversational":[18],"question":[19],"answering":[20],"(ConvQA)":[21],"systems":[22],"have":[23],"long":[24],"been":[25],"stymied":[26],"by":[27,86],"scarce":[28],"training":[29],"data":[30,168],"that":[31],"is":[32],"expensive":[33],"collect.":[35],"To":[36],"address":[37],"this":[38,113],"problem,":[39],"we":[40,77,122,174],"propose":[41],"a":[42,67,92],"new":[43],"technique":[44],"for":[45],"synthetically":[46],"generating":[47],"diverse":[48,132],"high-quality":[50],"dialog":[51,53,69,93],"data:":[52],"inpainting.":[54],"Our":[55],"approach":[56,114],"takes":[57],"the":[58,71,81,87,98,108,120,139,148],"text":[59],"of":[60,107,153],"any":[61],"document":[62],"transforms":[64],"it":[65],"into":[66],"two-person":[68],"between":[70,105],"writer":[72],"an":[74],"imagined":[75,99],"reader:":[76],"treat":[78],"sentences":[79],"from":[80,117],"article":[82],"as":[83,157],"utterances":[84],"spoken":[85],"writer,":[88],"then":[90],"use":[91],"inpainter":[94],"predict":[96],"what":[97],"reader":[100],"asked":[101],"or":[102,159],"said":[103],"each":[106],"writer's":[109],"utterances.":[110],"By":[111],"applying":[112],"passages":[116],"Wikipedia":[118],"web,":[121],"produce":[123],"WikiDialog":[124,154],"WebDialog,":[126],"two":[127],"datasets":[128],"totalling":[129],"19":[130],"million":[131],"information-seeking":[133],"dialogs":[134],"--":[135],"1,000x":[136],"larger":[137],"than":[138,161],"largest":[140],"existing":[141,162],"ConvQA":[142,171],"dataset.":[143],"Furthermore,":[144],"human":[145],"raters":[146],"judge":[147],"answer":[149],"adequacy":[150],"conversationality":[152],"be":[156],"good":[158],"better":[160],"manually-collected":[163],"datasets.":[164],"Using":[165],"our":[166],"inpainted":[167],"pre-train":[170],"retrieval":[172],"systems,":[173],"significantly":[175],"advance":[176],"state-of-the-art":[177],"across":[178],"three":[179],"benchmarks":[180],"(QReCC,":[181],"OR-QuAC,":[182],"TREC":[183],"CAsT)":[184],"yielding":[185],"up":[186],"40%":[188],"relative":[189],"gains":[190],"on":[191],"standard":[192],"evaluation":[193],"metrics.":[194]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":13},{"year":2022,"cited_by_count":3}],"updated_date":"2026-02-09T09:26:11.010843","created_date":"2025-10-10T00:00:00"}
