{"id":"https://openalex.org/W4393899832","doi":"https://doi.org/10.1117/12.3023177","title":"SAIGAN: arbitrary length and out-of-vocabulary handwriting synthesis preserving geometrical annotation","display_name":"SAIGAN: arbitrary length and out-of-vocabulary handwriting synthesis preserving geometrical annotation","publication_year":2024,"publication_date":"2024-04-03","ids":{"openalex":"https://openalex.org/W4393899832","doi":"https://doi.org/10.1117/12.3023177"},"language":"en","primary_location":{"id":"doi:10.1117/12.3023177","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1117/12.3023177","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Sixteenth International Conference on Machine Vision (ICMV 2023)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5094361669","display_name":"Konstantin K. Suloev","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Konstantin K. Suloev","raw_affiliation_strings":["Smart Engines Service LLC (Russian Federation)"],"affiliations":[{"raw_affiliation_string":"Smart Engines Service LLC (Russian Federation)","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023584111","display_name":"Yulia S. Chernyshova","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yulia S. Chernyshova","raw_affiliation_strings":["Federal Research Center \u201cComputer Science and Control\u201d (Russian Federation)","Smart Engines Service LLC (Russian Federation)","Federal Research Center \"Computer Science and Control\" (Russian Federation)"],"affiliations":[{"raw_affiliation_string":"Federal Research Center \u201cComputer Science and Control\u201d (Russian Federation)","institution_ids":[]},{"raw_affiliation_string":"Smart Engines Service LLC (Russian Federation)","institution_ids":[]},{"raw_affiliation_string":"Federal Research Center \"Computer Science and Control\" (Russian Federation)","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5070598827","display_name":"Alexander Sheshkus","orcid":"https://orcid.org/0000-0002-8970-8747"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alexander V. Sheshkus","raw_affiliation_strings":["Federal Research Center \u201cComputer Science and Control\u201d (Russian Federation)","Smart Engines Service LLC (Russian Federation)","Federal Research Center \"Computer Science and Control\" (Russian Federation)"],"affiliations":[{"raw_affiliation_string":"Federal Research Center \u201cComputer Science and Control\u201d (Russian Federation)","institution_ids":[]},{"raw_affiliation_string":"Smart Engines Service LLC (Russian Federation)","institution_ids":[]},{"raw_affiliation_string":"Federal Research Center \"Computer Science and Control\" (Russian Federation)","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5094361669"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.03687652,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"11433","issue":null,"first_page":"4","last_page":"4"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14339","display_name":"Image Processing and 3D Reconstruction","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9952999949455261,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/handwriting","display_name":"Handwriting","score":0.8580703735351562},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7735418081283569},{"id":"https://openalex.org/keywords/character","display_name":"Character (mathematics)","score":0.6710761785507202},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.6695306897163391},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.6525212526321411},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.5925742387771606},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.5841187238693237},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5592745542526245},{"id":"https://openalex.org/keywords/handwriting-recognition","display_name":"Handwriting recognition","score":0.542669415473938},{"id":"https://openalex.org/keywords/intelligent-character-recognition","display_name":"Intelligent character recognition","score":0.4877517819404602},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.46294865012168884},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4575338661670685},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.4495285749435425},{"id":"https://openalex.org/keywords/mnist-database","display_name":"MNIST database","score":0.43140149116516113},{"id":"https://openalex.org/keywords/optical-character-recognition","display_name":"Optical character recognition","score":0.4313703775405884},{"id":"https://openalex.org/keywords/style","display_name":"Style (visual arts)","score":0.4263265132904053},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3872659504413605},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3820209801197052},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.31691303849220276},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.27522557973861694},{"id":"https://openalex.org/keywords/character-recognition","display_name":"Character recognition","score":0.17037636041641235},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10503262281417847},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.0857161283493042}],"concepts":[{"id":"https://openalex.org/C2779386606","wikidata":"https://www.wikidata.org/wiki/Q2393642","display_name":"Handwriting","level":2,"score":0.8580703735351562},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7735418081283569},{"id":"https://openalex.org/C2780861071","wikidata":"https://www.wikidata.org/wiki/Q1062934","display_name":"Character (mathematics)","level":2,"score":0.6710761785507202},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.6695306897163391},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.6525212526321411},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.5925742387771606},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.5841187238693237},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5592745542526245},{"id":"https://openalex.org/C112640561","wikidata":"https://www.wikidata.org/wiki/Q2440634","display_name":"Handwriting recognition","level":3,"score":0.542669415473938},{"id":"https://openalex.org/C44868376","wikidata":"https://www.wikidata.org/wiki/Q3099089","display_name":"Intelligent character recognition","level":4,"score":0.4877517819404602},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.46294865012168884},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4575338661670685},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4495285749435425},{"id":"https://openalex.org/C190502265","wikidata":"https://www.wikidata.org/wiki/Q17069496","display_name":"MNIST database","level":3,"score":0.43140149116516113},{"id":"https://openalex.org/C546480517","wikidata":"https://www.wikidata.org/wiki/Q167555","display_name":"Optical character recognition","level":3,"score":0.4313703775405884},{"id":"https://openalex.org/C2776445246","wikidata":"https://www.wikidata.org/wiki/Q1792644","display_name":"Style (visual arts)","level":2,"score":0.4263265132904053},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3872659504413605},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3820209801197052},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.31691303849220276},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.27522557973861694},{"id":"https://openalex.org/C2987247673","wikidata":"https://www.wikidata.org/wiki/Q167555","display_name":"Character recognition","level":3,"score":0.17037636041641235},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10503262281417847},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0857161283493042},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1117/12.3023177","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1117/12.3023177","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Sixteenth International Conference on Machine Vision (ICMV 2023)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.5400000214576721}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":31,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W1810943226","https://openalex.org/W2064675550","https://openalex.org/W2127141656","https://openalex.org/W2157331557","https://openalex.org/W2899771611","https://openalex.org/W2963047498","https://openalex.org/W3003307646","https://openalex.org/W3003343025","https://openalex.org/W3003915459","https://openalex.org/W3003967978","https://openalex.org/W3109645351","https://openalex.org/W4250685322","https://openalex.org/W4288049477","https://openalex.org/W4289751412","https://openalex.org/W4301206121","https://openalex.org/W4323833492","https://openalex.org/W6631190155","https://openalex.org/W6638273328","https://openalex.org/W6683258052","https://openalex.org/W6753558063","https://openalex.org/W6756040250","https://openalex.org/W6759777974","https://openalex.org/W6760811728","https://openalex.org/W6761851811","https://openalex.org/W6765779288","https://openalex.org/W6773446742","https://openalex.org/W6774349176","https://openalex.org/W6775628630","https://openalex.org/W6796866110","https://openalex.org/W6808826384"],"related_works":["https://openalex.org/W3047607512","https://openalex.org/W3003949997","https://openalex.org/W4390983538","https://openalex.org/W2110485610","https://openalex.org/W4327773476","https://openalex.org/W183832189","https://openalex.org/W2011042697","https://openalex.org/W2135329887","https://openalex.org/W4366502683","https://openalex.org/W2406729210"],"abstract_inverted_index":{"Handwritten":[0],"text":[1,98],"recognition":[2],"(HTR)":[3],"is":[4,25,33,125],"a":[5,10],"challenging":[6],"task":[7],"that":[8,34],"requires":[9,37],"large":[11],"amount":[12],"of":[13,18,28,50,115],"diverse":[14],"training":[15,40],"data.":[16],"One":[17],"the":[19,26,35,45,58,75,92,96,102,109,147],"possible":[20,127],"approaches":[21],"to":[22,70,128,145],"this":[23],"problem":[24],"adoption":[27],"CNNs.":[29],"The":[30],"key":[31],"challenge":[32],"CNN":[36],"geometrically":[38],"labeled":[39],"data,":[41],"which":[42,66],"may":[43],"increase":[44],"cost":[46],"and":[47,111,119],"time":[48],"consumption":[49],"labeling.":[51],"To":[52],"overcome":[53],"these":[54],"limitations":[55],"we":[56],"propose":[57],"method,":[59],"based":[60],"on":[61,108],"<i>Generative":[62],"Adversarial":[63],"Network</i>":[64],"(GAN),":[65],"transfers":[67],"handwriting":[68,131],"styles":[69,132],"printed":[71,84],"style":[72,85,140],"images,":[73],"preserving":[74],"Same":[76],"geometrical":[77],"Annotation":[78],"as":[79,87],"Input":[80],"-":[81],"SAIGAN.":[82],"Taking":[83],"image":[86,94],"an":[88,116],"input,":[89],"it":[90,124],"produces":[91],"handwritten":[93],"with":[95],"same":[97,103],"content":[99],"located":[100],"in":[101],"positions.":[104],"Our":[105],"method":[106],"operates":[107],"character-level":[110],"can":[112],"produce":[113],"sequences":[114],"arbitrary":[117],"length":[118],"any":[120],"content.":[121],"Once":[122],"trained,":[123],"also":[126],"generate":[129],"new":[130],"by":[133],"simply":[134],"manipulating":[135],"latent":[136],"vectors.":[137],"Proposed":[138],"character":[139],"supervision":[141],"allowed":[142],"our":[143],"model":[144],"surpass":[146],"basis":[148],"method.":[149]},"counts_by_year":[],"updated_date":"2025-12-26T23:08:49.675405","created_date":"2025-10-10T00:00:00"}
