{"id":"https://openalex.org/W7140285148","doi":"https://doi.org/10.48550/arxiv.2603.22999","title":"PaperVoyager : Building Interactive Web with Visual Language Models","display_name":"PaperVoyager : Building Interactive Web with Visual Language Models","publication_year":2026,"publication_date":"2026-03-24","ids":{"openalex":"https://openalex.org/W7140285148","doi":"https://doi.org/10.48550/arxiv.2603.22999"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.22999","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22999","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.22999","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5010781772","display_name":"D. Z. Dai","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Dai, Dasen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130572637","display_name":"Biao Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Biao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130612959","display_name":"Meng Fang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fang, Meng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5130594422","display_name":"Wenhao Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Wenhao","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5010781772"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10799","display_name":"Data Visualization and Analytics","score":0.15189999341964722,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10799","display_name":"Data Visualization and Analytics","score":0.15189999341964722,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.15029999613761902,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10789","display_name":"Interactive and Immersive Displays","score":0.08449999988079071,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/executable","display_name":"Executable","score":0.7494999766349792},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.4408000111579895},{"id":"https://openalex.org/keywords/question-answering","display_name":"Question answering","score":0.3882000148296356},{"id":"https://openalex.org/keywords/interactive-design","display_name":"Interactive design","score":0.37070000171661377},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.3483999967575073},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.3474999964237213},{"id":"https://openalex.org/keywords/interactive-visualization","display_name":"Interactive visualization","score":0.34689998626708984},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.33090001344680786}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.842199981212616},{"id":"https://openalex.org/C160145156","wikidata":"https://www.wikidata.org/wiki/Q778586","display_name":"Executable","level":2,"score":0.7494999766349792},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.5163999795913696},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4408000111579895},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.3882000148296356},{"id":"https://openalex.org/C86297840","wikidata":"https://www.wikidata.org/wiki/Q6045397","display_name":"Interactive design","level":2,"score":0.37070000171661377},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3677999973297119},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.3483999967575073},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.3474999964237213},{"id":"https://openalex.org/C64073096","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Interactive visualization","level":3,"score":0.34689998626708984},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.33090001344680786},{"id":"https://openalex.org/C21959979","wikidata":"https://www.wikidata.org/wiki/Q36774","display_name":"Web page","level":2,"score":0.3294000029563904},{"id":"https://openalex.org/C118643609","wikidata":"https://www.wikidata.org/wiki/Q189210","display_name":"Web application","level":2,"score":0.31929999589920044},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.31220000982284546},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.2937000095844269},{"id":"https://openalex.org/C2780878386","wikidata":"https://www.wikidata.org/wiki/Q1659648","display_name":"Visual language","level":2,"score":0.29280000925064087},{"id":"https://openalex.org/C2777055276","wikidata":"https://www.wikidata.org/wiki/Q7936580","display_name":"Visual approach","level":2,"score":0.2858000099658966},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.27649998664855957},{"id":"https://openalex.org/C2779125210","wikidata":"https://www.wikidata.org/wiki/Q16622442","display_name":"Interactive programming","level":2,"score":0.27619999647140503},{"id":"https://openalex.org/C89505385","wikidata":"https://www.wikidata.org/wiki/Q47146","display_name":"User interface","level":2,"score":0.26759999990463257},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.2667999863624573}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.22999","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22999","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.22999","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22999","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Recent":[0],"advances":[1],"in":[2],"visual":[3],"language":[4],"models":[5,123],"have":[6],"enabled":[7],"autonomous":[8],"agents":[9,21],"for":[10,37,146],"complex":[11],"reasoning,":[12],"tool":[13],"use,":[14],"and":[15,43,80,89,125],"document":[16,20],"understanding.":[17,150],"However,":[18],"existing":[19],"mainly":[22],"transform":[23],"papers":[24,39,57,104],"into":[25,58],"static":[26],"artifacts":[27],"such":[28],"as":[29,110],"summaries,":[30],"webpages,":[31],"or":[32],"slides,":[33],"which":[34],"are":[35],"insufficient":[36],"technical":[38],"involving":[40],"dynamic":[41,91],"mechanisms":[42,124],"state":[44],"transitions.":[45],"In":[46],"this":[47,95],"work,":[48],"we":[49,97],"propose":[50,115],"a":[51,64,99,117,143],"Paper-to-Interactive-System":[52],"Agent":[53],"that":[54,121,132],"converts":[55],"research":[56,103],"executable":[59],"interactive":[60,81,108,140,147],"web":[61],"systems.":[62],"Given":[63],"PDF":[65],"paper,":[66],"the":[67,136],"agent":[68],"performs":[69],"end-to-end":[70],"processing":[71],"without":[72],"human":[73],"intervention,":[74],"including":[75],"paper":[76,149],"understanding,":[77],"system":[78],"modeling,":[79],"webpage":[82],"synthesis,":[83],"enabling":[84],"users":[85],"to":[86],"manipulate":[87],"inputs":[88],"observe":[90],"behaviors.":[92],"To":[93],"evaluate":[94],"task,":[96],"introduce":[98],"benchmark":[100],"of":[101,138],"19":[102],"paired":[105],"with":[106],"expert-built":[107],"systems":[109],"ground":[111],"truth.":[112],"We":[113],"further":[114],"PaperVoyager,":[116],"structured":[118],"generation":[119],"framework":[120],"explicitly":[122],"interaction":[126],"logic":[127],"during":[128],"synthesis.":[129],"Experiments":[130],"show":[131],"PaperVoyager":[133],"significantly":[134],"improves":[135],"quality":[137],"generated":[139],"systems,":[141],"offering":[142],"new":[144],"paradigm":[145],"scientific":[148]},"counts_by_year":[],"updated_date":"2026-03-26T06:10:45.909354","created_date":"2026-03-26T00:00:00"}
