{"id":"https://openalex.org/W3033209696","doi":"https://doi.org/10.1145/3392093","title":"psc2code","display_name":"psc2code","publication_year":2020,"publication_date":"2020-06-01","ids":{"openalex":"https://openalex.org/W3033209696","doi":"https://doi.org/10.1145/3392093","mag":"3033209696"},"language":"en","primary_location":{"id":"doi:10.1145/3392093","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3392093","pdf_url":null,"source":{"id":"https://openalex.org/S142627899","display_name":"ACM Transactions on Software Engineering and Methodology","issn_l":"1049-331X","issn":["1049-331X","1557-7392"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Software Engineering and Methodology","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2103.11610","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5007075465","display_name":"Lingfeng Bao","orcid":"https://orcid.org/0000-0003-1846-0921"},"institutions":[{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]},{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Lingfeng Bao","raw_affiliation_strings":["College of Computer Science and Technology, Zhejiang University, China and Ningbo Research Institute, Zhejiang University, China and PengCheng Laboratory, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Zhejiang University, China and Ningbo Research Institute, Zhejiang University, China and PengCheng Laboratory, China","institution_ids":["https://openalex.org/I76130692","https://openalex.org/I4210136793"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028641941","display_name":"Zhenchang Xing","orcid":"https://orcid.org/0000-0001-7663-1421"},"institutions":[{"id":"https://openalex.org/I118347636","display_name":"Australian National University","ror":"https://ror.org/019wvm592","country_code":"AU","type":"education","lineage":["https://openalex.org/I118347636"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Zhenchang Xing","raw_affiliation_strings":["Australian National University, Australia"],"affiliations":[{"raw_affiliation_string":"Australian National University, Australia","institution_ids":["https://openalex.org/I118347636"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006669765","display_name":"Xin Xia","orcid":"https://orcid.org/0000-0002-6302-3256"},"institutions":[{"id":"https://openalex.org/I56590836","display_name":"Monash University","ror":"https://ror.org/02bfwt286","country_code":"AU","type":"education","lineage":["https://openalex.org/I56590836"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Xin Xia","raw_affiliation_strings":["Monash University, Australia"],"affiliations":[{"raw_affiliation_string":"Monash University, Australia","institution_ids":["https://openalex.org/I56590836"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081036622","display_name":"David Lo","orcid":"https://orcid.org/0000-0002-4367-7201"},"institutions":[{"id":"https://openalex.org/I79891267","display_name":"Singapore Management University","ror":"https://ror.org/050qmg959","country_code":"SG","type":"education","lineage":["https://openalex.org/I79891267"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"David Lo","raw_affiliation_strings":["Singapore Management University, Singapore"],"affiliations":[{"raw_affiliation_string":"Singapore Management University, Singapore","institution_ids":["https://openalex.org/I79891267"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101925641","display_name":"Minghui Wu","orcid":"https://orcid.org/0000-0001-8179-7119"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Minghui Wu","raw_affiliation_strings":["Zhejiang University City College, China"],"affiliations":[{"raw_affiliation_string":"Zhejiang University City College, China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101577570","display_name":"Xiaohu Yang","orcid":"https://orcid.org/0000-0003-4111-4189"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaohu Yang","raw_affiliation_strings":["Zhejiang University, China"],"affiliations":[{"raw_affiliation_string":"Zhejiang University, China","institution_ids":["https://openalex.org/I76130692"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5007075465"],"corresponding_institution_ids":["https://openalex.org/I4210136793","https://openalex.org/I76130692"],"apc_list":null,"apc_paid":null,"fwci":4.1724,"has_fulltext":false,"cited_by_count":25,"citation_normalized_percentile":{"value":0.94797804,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"29","issue":"3","first_page":"1","last_page":"38"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.9779999852180481,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9555000066757202,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8862425088882446},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.6920099854469299},{"id":"https://openalex.org/keywords/optical-character-recognition","display_name":"Optical character recognition","score":0.5165244936943054},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.49840283393859863},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4920505881309509},{"id":"https://openalex.org/keywords/identifier","display_name":"Identifier","score":0.4520249366760254},{"id":"https://openalex.org/keywords/computer-programming","display_name":"Computer programming","score":0.4423605501651764},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.4249749481678009},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.394214391708374},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.19978004693984985},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.17571315169334412}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8862425088882446},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.6920099854469299},{"id":"https://openalex.org/C546480517","wikidata":"https://www.wikidata.org/wiki/Q167555","display_name":"Optical character recognition","level":3,"score":0.5165244936943054},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.49840283393859863},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4920505881309509},{"id":"https://openalex.org/C154504017","wikidata":"https://www.wikidata.org/wiki/Q853614","display_name":"Identifier","level":2,"score":0.4520249366760254},{"id":"https://openalex.org/C33857546","wikidata":"https://www.wikidata.org/wiki/Q80006","display_name":"Computer programming","level":2,"score":0.4423605501651764},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.4249749481678009},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.394214391708374},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.19978004693984985},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.17571315169334412},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1145/3392093","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3392093","pdf_url":null,"source":{"id":"https://openalex.org/S142627899","display_name":"ACM Transactions on Software Engineering and Methodology","issn_l":"1049-331X","issn":["1049-331X","1557-7392"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Software Engineering and Methodology","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2103.11610","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2103.11610","pdf_url":"https://arxiv.org/pdf/2103.11610","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:ink.library.smu.edu.sg:sis_research-6624","is_oa":false,"landing_page_url":"https://ink.library.smu.edu.sg/sis_research/5621","pdf_url":null,"source":{"id":"https://openalex.org/S4377196871","display_name":"Institutional Knowledge (InK) - Institutional Knowledge at Singapore Management University (Singapore Management University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I79891267","host_organization_name":"Singapore Management University","host_organization_lineage":["https://openalex.org/I79891267"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"https://doi.org/10.1145/3392093","raw_type":"Journal Article"},{"id":"doi:10.48550/arxiv.2103.11610","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2103.11610","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article-journal"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2103.11610","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2103.11610","pdf_url":"https://arxiv.org/pdf/2103.11610","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G964035141","display_name":null,"funder_award_id":"61972339 and 61902344","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W7746136","https://openalex.org/W1660390307","https://openalex.org/W1673310716","https://openalex.org/W1973501456","https://openalex.org/W1975879668","https://openalex.org/W2035965376","https://openalex.org/W2051525497","https://openalex.org/W2073426284","https://openalex.org/W2081479026","https://openalex.org/W2081845926","https://openalex.org/W2089759055","https://openalex.org/W2116737258","https://openalex.org/W2141125339","https://openalex.org/W2145023731","https://openalex.org/W2148615889","https://openalex.org/W2155912251","https://openalex.org/W2158447593","https://openalex.org/W2160528879","https://openalex.org/W2162939096","https://openalex.org/W2244385525","https://openalex.org/W2271359621","https://openalex.org/W2376637698","https://openalex.org/W2517817194","https://openalex.org/W2532717157","https://openalex.org/W2774526117","https://openalex.org/W2789980854","https://openalex.org/W2808909528","https://openalex.org/W2883213995","https://openalex.org/W2883305011","https://openalex.org/W2883811619","https://openalex.org/W2896459014","https://openalex.org/W2947510423","https://openalex.org/W2963037989","https://openalex.org/W2992939092","https://openalex.org/W3149255455","https://openalex.org/W4211214670","https://openalex.org/W4244606080","https://openalex.org/W4250533120","https://openalex.org/W4252684946"],"related_works":["https://openalex.org/W4378651134","https://openalex.org/W4252684102","https://openalex.org/W2352307597","https://openalex.org/W1979633005","https://openalex.org/W2163724607","https://openalex.org/W3120493416","https://openalex.org/W2098192829","https://openalex.org/W2772430765","https://openalex.org/W3089461718","https://openalex.org/W2312318148"],"abstract_inverted_index":{"Programming":[0],"screencasts":[1,24,39,316],"have":[2],"become":[3],"a":[4,41,235,257,266,295,384,432],"pervasive":[5],"resource":[6],"on":[7,240,313,341,371,397],"the":[8,34,47,54,58,63,96,137,167,172,178,196,208,241,248,263,275,281,286,290,305,330,342,354,357,372,398,403,418,458,461],"Internet,":[9],"which":[10,82,335],"help":[11,455],"developers":[12,50],"learn":[13,457],"new":[14],"programming":[15,23,38,183,203,287,315,385,392,406,413,438,462],"technologies":[16],"or":[17],"skills.":[18],"The":[19,159],"source":[20,55,99,152,162,179,200,272,299,307,359,373,399],"code":[21,56,100,126,129,138,153,163,180,201,236,258,273,277,300,344,360,374,400],"in":[22,57,130,182,234,285,304,460],"is":[25,252],"an":[26,190,311,337,390],"important":[27],"and":[28,87,124,175,219,227,238,246,279,289,332,421,426,466],"valuable":[29],"information":[30,284],"for":[31,104],"developers.":[32],"But":[33],"streaming":[35],"nature":[36],"of":[37,43,98,113,177,198,265,294,298,339,356,366,423,435],"(i.e.,":[40],"sequence":[42],"screen-captured":[44],"images)":[45],"limits":[46],"ways":[48],"that":[49,251,321,349,411,449],"can":[51,83,327,351,454],"interact":[52],"with":[53,128,442],"screencasts.":[59,184,204],"Many":[60],"studies":[61],"use":[62],"Optical":[64],"Character":[65],"Recognition":[66],"(OCR)":[67],"technique":[68,326],"to":[69,75,136,194,216,231,255,270,301],"convert":[70],"screen":[71,92,157,249],"images":[72,93],"(also":[73],"referred":[74],"as":[76,171],"video":[77,463],"frames)":[78],"into":[79],"textual":[80],"content,":[81],"then":[84],"be":[85,256],"indexed":[86],"searched":[88],"easily.":[89],"However,":[90],"noisy":[91,125,160],"significantly":[94,352],"affect":[95,166],"quality":[97,355],"extracted":[101,401],"by":[102,361,376],"OCR,":[103],"example,":[105],"no-code":[106],"frames":[107],"(e.g.,":[108,118,140],"PowerPoint":[109],"slides,":[110],"web":[111],"pages":[112],"API":[114,264],"specification),":[115],"non-code":[116,218,331],"regions":[117,127,278],"Package":[119],"Explorer":[120],"view,":[121],"Console":[122],"view),":[123],"completion":[131],"suggestion":[132],"popups.":[133],"Furthermore,":[134],"due":[135],"characteristics":[139],"long":[141],"compound":[142],"identifiers":[143],"like":[144],"ItemListener),":[145],"even":[146],"professional":[147,267],"OCR":[148,268],"tools":[149],"cannot":[150],"extract":[151,271],"without":[154],"errors":[155,303],"from":[156,202,274,317,402],"images.":[158],"OCRed":[161,282,306,358,368],"will":[164],"negatively":[165],"downstream":[168],"applications,":[169],"such":[170],"effective":[173],"search":[174,387,415],"navigation":[176],"content":[181],"In":[185],"this":[186],"article,":[187],"we":[188,379],"propose":[189],"approach":[191],"named":[192],"psc2code":[193,206,223,261,350,377],"denoise":[195],"process":[197],"extracting":[199],"First,":[205],"leverages":[207,280],"Convolutional":[209],"Neural":[210],"Network":[211],"(CNN)":[212],"based":[213,239],"image":[214,229,324],"classification":[215,325],"remove":[217,329],"noisy-code":[220,333],"frames.":[221,345],"Then,":[222],"performs":[224],"edge":[225],"detection":[226],"clustering-based":[228],"segmentation":[230],"detect":[232],"sub-windows":[233],"frame,":[237],"detected":[242],"sub-windows,":[243],"it":[244],"identifies":[245],"crops":[247],"region":[250],"most":[253],"likely":[254],"editor.":[259],"Finally,":[260],"calls":[262],"tool":[269,441,453],"cropped":[276],"cross-frame":[283],"screencast":[288,386,393,414,439],"statistical":[291],"language":[292],"model":[293],"large":[296],"corpus":[297],"correct":[302],"code.":[308],"We":[309,319,346,429],"conduct":[310,431],"experiment":[312],"1,142":[314,404],"YouTube.":[318],"find":[320,348],"our":[322,408,412,436,450],"CNN-based":[323],"effectively":[328],"frames,":[334],"achieves":[336,417],"F1-score":[338],"0.95":[340],"valid":[343],"also":[347,430],"improve":[353],"truly":[362],"correcting":[363],"about":[364],"half":[365],"incorrectly":[367],"words.":[369],"Based":[370,396],"denoised":[375],",":[378],"implement":[380],"two":[381],"applications:":[382],"(1)":[383],"engine;":[388],"(2)":[389],"interaction-enhanced":[391,437,451],"watching":[394,440,452],"tool.":[395],"collected":[405],"screencasts,":[407],"experiments":[409],"show":[410],"engine":[416],"precision@5,":[419],"10,":[420],"20":[422],"0.93,":[424],"0.81,":[425],"0.63,":[427],"respectively.":[428],"user":[433,446],"study":[434,447],"10":[443],"participants.":[444],"This":[445],"shows":[448],"participants":[456],"knowledge":[459],"more":[464],"efficiently":[465],"effectively.":[467]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":6},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":2}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2020-06-12T00:00:00"}
