{"id":"https://openalex.org/W4389575063","doi":"https://doi.org/10.1145/3610548.3618174","title":"UVDoc: Neural Grid-based Document Unwarping","display_name":"UVDoc: Neural Grid-based Document Unwarping","publication_year":2023,"publication_date":"2023-12-10","ids":{"openalex":"https://openalex.org/W4389575063","doi":"https://doi.org/10.1145/3610548.3618174"},"language":"en","primary_location":{"id":"doi:10.1145/3610548.3618174","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3610548.3618174","pdf_url":null,"source":null,"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"SIGGRAPH Asia 2023 Conference Papers","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3610548.3618174","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5002034143","display_name":"Floor Verhoeven","orcid":"https://orcid.org/0000-0003-3768-0460"},"institutions":[{"id":"https://openalex.org/I35440088","display_name":"ETH Zurich","ror":"https://ror.org/05a28rw58","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I35440088"]}],"countries":["CH"],"is_corresponding":true,"raw_author_name":"Floor Verhoeven","raw_affiliation_strings":["ETH Zurich, Switzerland"],"affiliations":[{"raw_affiliation_string":"ETH Zurich, Switzerland","institution_ids":["https://openalex.org/I35440088"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043613770","display_name":"Tanguy Magne","orcid":"https://orcid.org/0009-0001-0231-026X"},"institutions":[{"id":"https://openalex.org/I35440088","display_name":"ETH Zurich","ror":"https://ror.org/05a28rw58","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I35440088"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Tanguy Magne","raw_affiliation_strings":["ETH Zurich, Switzerland"],"affiliations":[{"raw_affiliation_string":"ETH Zurich, Switzerland","institution_ids":["https://openalex.org/I35440088"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5064927253","display_name":"Olga Sorkine\u2010Hornung","orcid":"https://orcid.org/0000-0002-8089-3974"},"institutions":[{"id":"https://openalex.org/I35440088","display_name":"ETH Zurich","ror":"https://ror.org/05a28rw58","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I35440088"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Olga Sorkine-Hornung","raw_affiliation_strings":["ETH Zurich, Switzerland"],"affiliations":[{"raw_affiliation_string":"ETH Zurich, Switzerland","institution_ids":["https://openalex.org/I35440088"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5002034143"],"corresponding_institution_ids":["https://openalex.org/I35440088"],"apc_list":null,"apc_paid":null,"fwci":1.4443,"has_fulltext":false,"cited_by_count":12,"citation_normalized_percentile":{"value":0.84570823,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"11"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10638","display_name":"Optical measurement and interference techniques","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization Techniques","score":0.9947999715805054,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8348318338394165},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.7413631081581116},{"id":"https://openalex.org/keywords/grid","display_name":"Grid","score":0.6887592077255249},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6038134098052979},{"id":"https://openalex.org/keywords/ground-truth","display_name":"Ground truth","score":0.5800365805625916},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.5441005229949951},{"id":"https://openalex.org/keywords/distortion","display_name":"Distortion (music)","score":0.5038804411888123},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.47795891761779785},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.4369671642780304},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.4349937438964844},{"id":"https://openalex.org/keywords/viewport","display_name":"Viewport","score":0.41645869612693787}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8348318338394165},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.7413631081581116},{"id":"https://openalex.org/C187691185","wikidata":"https://www.wikidata.org/wiki/Q2020720","display_name":"Grid","level":2,"score":0.6887592077255249},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6038134098052979},{"id":"https://openalex.org/C146849305","wikidata":"https://www.wikidata.org/wiki/Q370766","display_name":"Ground truth","level":2,"score":0.5800365805625916},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.5441005229949951},{"id":"https://openalex.org/C126780896","wikidata":"https://www.wikidata.org/wiki/Q899871","display_name":"Distortion (music)","level":4,"score":0.5038804411888123},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.47795891761779785},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.4369671642780304},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.4349937438964844},{"id":"https://openalex.org/C2778090530","wikidata":"https://www.wikidata.org/wiki/Q2523931","display_name":"Viewport","level":2,"score":0.41645869612693787},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C194257627","wikidata":"https://www.wikidata.org/wiki/Q211554","display_name":"Amplifier","level":3,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3610548.3618174","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3610548.3618174","pdf_url":null,"source":null,"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"SIGGRAPH Asia 2023 Conference Papers","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3610548.3618174","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3610548.3618174","pdf_url":null,"source":null,"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"SIGGRAPH Asia 2023 Conference Papers","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10","score":0.6899999976158142}],"awards":[{"id":"https://openalex.org/G3530536246","display_name":null,"funder_award_id":"101003104","funder_id":"https://openalex.org/F4320334678","funder_display_name":"European Research Council"}],"funders":[{"id":"https://openalex.org/F4320334678","display_name":"European Research Council","ror":"https://ror.org/0472cxd90"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W236100371","https://openalex.org/W2027238116","https://openalex.org/W2033628967","https://openalex.org/W2047643928","https://openalex.org/W2084911352","https://openalex.org/W2098270921","https://openalex.org/W2115263911","https://openalex.org/W2120449447","https://openalex.org/W2121498135","https://openalex.org/W2129165900","https://openalex.org/W2140089569","https://openalex.org/W2145032989","https://openalex.org/W2149884040","https://openalex.org/W2161175365","https://openalex.org/W2412396436","https://openalex.org/W2786983711","https://openalex.org/W2798905980","https://openalex.org/W2894857688","https://openalex.org/W2981771415","https://openalex.org/W2985998306","https://openalex.org/W3047176958","https://openalex.org/W3049081235","https://openalex.org/W3207713347","https://openalex.org/W3210178292","https://openalex.org/W4214546754","https://openalex.org/W4221149365","https://openalex.org/W4251279466","https://openalex.org/W4285529970","https://openalex.org/W4285981773","https://openalex.org/W4304091571","https://openalex.org/W4311992557","https://openalex.org/W4312462986","https://openalex.org/W4312861879","https://openalex.org/W4312891697","https://openalex.org/W4312950516","https://openalex.org/W4313829392","https://openalex.org/W4366458615","https://openalex.org/W4367368531"],"related_works":["https://openalex.org/W4389095575","https://openalex.org/W2908978341","https://openalex.org/W4294975495","https://openalex.org/W2992753629","https://openalex.org/W3161069372","https://openalex.org/W3171203216","https://openalex.org/W3123914255","https://openalex.org/W4225714298","https://openalex.org/W2948809149","https://openalex.org/W3035535334"],"abstract_inverted_index":{"Restoring":[0],"the":[1,52,57,60,71,74,103,138,157,166,178,194,200],"original,":[2],"flat":[3],"appearance":[4,101],"of":[5,12,56,76,80,159,180,203],"a":[6,18,27,42,66,77,220,230],"printed":[7],"document":[8,33,58,121,164],"from":[9],"casual":[10],"photographs":[11],"bent":[13],"and":[14,59,82,111,128,210,228,241],"wrinkled":[15],"pages":[16],"is":[17,97,134],"common":[19],"everyday":[20],"problem.":[21],"In":[22,86],"this":[23],"paper":[24,81],"we":[25,109],"propose":[26,229],"novel":[28,182,221],"method":[29,36],"for":[30,208],"grid-based":[31],"single-image":[32],"unwarping.":[34,237],"Our":[35,132,238],"performs":[37],"geometric":[38],"distortion":[39],"correction":[40],"via":[41],"fully":[43],"convolutional":[44],"deep":[45],"neural":[46],"network":[47,188],"that":[48,96,153,174,176,199,224,232],"learns":[49],"to":[50,88,92,141,148],"predict":[51],"3D":[53,78,126],"grid":[54,64],"mesh":[55],"corresponding":[61],"2D":[62,84],"unwarping":[63,90,129,144],"in":[65,100,163,165],"dual-task":[67],"fashion,":[68],"implicitly":[69],"encoding":[70],"coupling":[72],"between":[73],"shape":[75,127],"piece":[79],"its":[83],"image.":[85],"order":[87],"allow":[89],"models":[91],"train":[93,142],"on":[94,193],"data":[95],"more":[98],"realistic":[99],"than":[102],"commonly":[104],"used":[105],"synthetic":[106],"Doc3D":[107],"dataset,":[108,115,184],"create":[110],"publish":[112],"our":[113,143,181,185,204],"own":[114],"called":[116],"UVDoc,":[117],"which":[118],"combines":[119],"pseudo-photorealistic":[120,183,201],"images":[122],"with":[123,136,156,177],"physically":[124],"accurate":[125],"function":[130],"annotations.":[131],"dataset":[133,206,223,243],"labeled":[135],"all":[137],"information":[139],"necessary":[140],"network,":[145],"without":[146],"having":[147],"engineer":[149],"separate":[150],"loss":[151],"functions":[152],"can":[154],"deal":[155],"lack":[158],"ground-truth":[160],"typically":[161],"found":[162],"wild":[167],"datasets.":[168],"We":[169,197,218],"perform":[170],"an":[171],"in-depth":[172],"evaluation":[173,212],"demonstrates":[175],"inclusion":[179],"relatively":[186],"small":[187],"architecture":[189],"achieves":[190],"state-of-the-art":[191],"results":[192,240],"DocUNet":[195],"benchmark.":[196],"show":[198],"nature":[202],"UVDoc":[205,242],"allows":[207],"new":[209],"better":[211],"methods,":[213],"such":[214,226],"as":[215],"lighting-corrected":[216],"MS-SSIM.":[217],"provide":[219],"benchmark":[222],"facilitates":[225],"evaluations,":[227],"metric":[231],"quantifies":[233],"line":[234],"straightness":[235],"after":[236],"code,":[239],"are":[244],"available":[245],"at":[246],"https://github.com/tanguymagne/UVDoc.":[247]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
