{"id":"https://openalex.org/W3015959778","doi":"https://doi.org/10.1109/icassp40776.2020.9054360","title":"Adversarial Text Image Super-Resolution using Sinkhorn Distance","display_name":"Adversarial Text Image Super-Resolution using Sinkhorn Distance","publication_year":2020,"publication_date":"2020-04-09","ids":{"openalex":"https://openalex.org/W3015959778","doi":"https://doi.org/10.1109/icassp40776.2020.9054360","mag":"3015959778"},"language":"en","primary_location":{"id":"doi:10.1109/icassp40776.2020.9054360","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp40776.2020.9054360","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2020 - 2020 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5107885738","display_name":"Cong Geng","orcid":"https://orcid.org/0000-0002-3129-8941"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Cong Geng","raw_affiliation_strings":["Institute of Image Communication and Network Engineering, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Institute of Image Communication and Network Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100379203","display_name":"Li Chen","orcid":"https://orcid.org/0000-0001-9899-2535"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Li Chen","raw_affiliation_strings":["Institute of Image Communication and Network Engineering, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Institute of Image Communication and Network Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100452809","display_name":"Xiaoyun Zhang","orcid":"https://orcid.org/0000-0001-7680-4062"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoyun Zhang","raw_affiliation_strings":["Institute of Image Communication and Network Engineering, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Institute of Image Communication and Network Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101926731","display_name":"Zhiyong Gao","orcid":"https://orcid.org/0000-0003-4204-6536"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiyong Gao","raw_affiliation_strings":["Institute of Image Communication and Network Engineering, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Institute of Image Communication and Network Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5107885738"],"corresponding_institution_ids":["https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":0.3908,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.60319621,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"2663","last_page":"2667"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10688","display_name":"Image and Signal Denoising Methods","score":0.989300012588501,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13114","display_name":"Image Processing Techniques and Applications","score":0.984499990940094,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7702351808547974},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.6015528440475464},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5231279730796814},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5226231217384338},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.49472281336784363},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.48942461609840393},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.47619616985321045},{"id":"https://openalex.org/keywords/feature-vector","display_name":"Feature vector","score":0.4514358639717102},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.4169151186943054},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3592568039894104},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3581993579864502},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3510705232620239}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7702351808547974},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.6015528440475464},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5231279730796814},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5226231217384338},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.49472281336784363},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.48942461609840393},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.47619616985321045},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.4514358639717102},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4169151186943054},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3592568039894104},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3581993579864502},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3510705232620239},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp40776.2020.9054360","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp40776.2020.9054360","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2020 - 2020 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W54257720","https://openalex.org/W935139217","https://openalex.org/W1594039573","https://openalex.org/W1775434803","https://openalex.org/W1885185971","https://openalex.org/W2072610689","https://openalex.org/W2085463895","https://openalex.org/W2103261301","https://openalex.org/W2121058967","https://openalex.org/W2158131535","https://openalex.org/W2242218935","https://openalex.org/W2331128040","https://openalex.org/W2476548250","https://openalex.org/W2542551142","https://openalex.org/W2747898905","https://openalex.org/W2792425829","https://openalex.org/W2792491038","https://openalex.org/W2794849006","https://openalex.org/W2962953661","https://openalex.org/W2963372104","https://openalex.org/W2963398399","https://openalex.org/W2963470893","https://openalex.org/W2963506485","https://openalex.org/W2963645788","https://openalex.org/W2964125708","https://openalex.org/W4293418191","https://openalex.org/W6602211262","https://openalex.org/W6624640001","https://openalex.org/W6637845829","https://openalex.org/W6682962330","https://openalex.org/W6702130928","https://openalex.org/W6729190629","https://openalex.org/W6745847804","https://openalex.org/W6749053038","https://openalex.org/W6750161017","https://openalex.org/W6756302011"],"related_works":["https://openalex.org/W4293226380","https://openalex.org/W4321487865","https://openalex.org/W4313906399","https://openalex.org/W4391266461","https://openalex.org/W2590798552","https://openalex.org/W2811106690","https://openalex.org/W4239306820","https://openalex.org/W2947043951","https://openalex.org/W4312417841","https://openalex.org/W4210874298"],"abstract_inverted_index":{"Convolutional":[0],"neural":[1],"network-based":[2],"methods":[3,14],"have":[4],"demonstrated":[5],"promising":[6],"results":[7,116],"for":[8,56],"single":[9],"image":[10],"super-resolution.":[11],"However,":[12],"existing":[13],"usually":[15],"approach":[16],"the":[17,26,41,48,85,89,107,138],"problem":[18],"on":[19,117],"natural":[20],"scenes":[21],"rather":[22],"than":[23],"texts,":[24],"whereas":[25],"latter":[27],"can":[28,105],"provide":[29],"more":[30],"informative":[31],"messages":[32],"to":[33],"viewers.":[34],"In":[35],"this":[36],"paper,":[37],"instead":[38],"of":[39,96,110],"using":[40],"L":[42],"<sub":[43],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[44],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">p</sub>":[45],"-norm":[46],"as":[47],"supervision":[49],"metric,":[50],"we":[51],"propose":[52],"a":[53,71],"novel":[54],"one":[55],"better":[57],"preserving":[58],"semantic":[59],"information":[60],"in":[61,70,78,94,129],"text":[62,118],"images.":[63],"Our":[64],"new":[65],"metric":[66,104],"combines":[67],"optimal":[68],"transport":[69],"primal":[72],"form":[73],"with":[74],"Sinkhorn":[75,86],"distance":[76,87],"defined":[77],"an":[79],"adversarially":[80],"learned":[81],"feature":[82,98],"space.":[83],"Since":[84],"measures":[88],"similarity":[90],"between":[91],"two":[92],"features":[93],"terms":[95],"both":[97,130],"components":[99],"and":[100,132,141],"spatial":[101,108],"locations,":[102],"our":[103,122],"maintain":[106],"structure":[109],"texts":[111],"during":[112],"network":[113],"optimization.":[114],"Experimental":[115],"datasets":[119],"show":[120],"that":[121],"method":[123],"performs":[124],"favorably":[125],"against":[126],"state-of-the-art":[127],"approaches":[128],"quantitative":[131],"qualitative":[133],"evaluations.":[134],"We":[135],"will":[136],"publish":[137],"code,":[139],"datasets,":[140],"models":[142],"upon":[143],"acceptance.":[144]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2021,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
