{"id":"https://openalex.org/W3104859925","doi":"https://doi.org/10.1145/3368089.3417067","title":"Clustering test steps in natural language toward automating test automation","display_name":"Clustering test steps in natural language toward automating test automation","publication_year":2020,"publication_date":"2020-11-08","ids":{"openalex":"https://openalex.org/W3104859925","doi":"https://doi.org/10.1145/3368089.3417067","mag":"3104859925"},"language":"en","primary_location":{"id":"doi:10.1145/3368089.3417067","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3368089.3417067","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 28th ACM Joint Meeting on European Software Engineering Conference and Symposium on the Foundations of Software Engineering","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101915882","display_name":"Linyi Li","orcid":"https://orcid.org/0000-0002-5403-3217"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Linyi Li","raw_affiliation_strings":["University of Illinois at Urbana-Champaign, USA"],"raw_orcid":"https://orcid.org/0000-0002-5403-3217","affiliations":[{"raw_affiliation_string":"University of Illinois at Urbana-Champaign, USA","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048146501","display_name":"Zhenwen Li","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhenwen Li","raw_affiliation_strings":["Peking University, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Peking University, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100366508","display_name":"Weijie Zhang","orcid":"https://orcid.org/0009-0003-0755-6140"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weijie Zhang","raw_affiliation_strings":["Tencent, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tencent, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006051150","display_name":"Jun Zhou","orcid":"https://orcid.org/0000-0002-5545-2659"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jun Zhou","raw_affiliation_strings":["Tencent, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tencent, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100441267","display_name":"Pengcheng Wang","orcid":"https://orcid.org/0000-0001-5398-5956"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Pengcheng Wang","raw_affiliation_strings":["Tencent, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tencent, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101457424","display_name":"Jing Wu","orcid":"https://orcid.org/0000-0001-7430-7003"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jing Wu","raw_affiliation_strings":["Tencent, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tencent, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070223606","display_name":"Guanghua He","orcid":"https://orcid.org/0000-0001-9494-4712"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guanghua He","raw_affiliation_strings":["Tencent, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tencent, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113789363","display_name":"Xia Zeng","orcid":null},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xia Zeng","raw_affiliation_strings":["Tencent, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tencent, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060932650","display_name":"Yuetang Deng","orcid":"https://orcid.org/0009-0003-7060-4109"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuetang Deng","raw_affiliation_strings":["Tencent, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tencent, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5048118068","display_name":"Tao Xie","orcid":"https://orcid.org/0000-0002-6731-216X"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tao Xie","raw_affiliation_strings":["Peking University, China"],"raw_orcid":"https://orcid.org/0000-0002-6731-216X","affiliations":[{"raw_affiliation_string":"Peking University, China","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":10,"corresponding_author_ids":["https://openalex.org/A5101915882"],"corresponding_institution_ids":["https://openalex.org/I157725225"],"apc_list":null,"apc_paid":null,"fwci":2.2432,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.8845077,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1285","last_page":"1295"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7991894483566284},{"id":"https://openalex.org/keywords/test-script","display_name":"Test script","score":0.7289246916770935},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.6990504264831543},{"id":"https://openalex.org/keywords/executable","display_name":"Executable","score":0.6717833280563354},{"id":"https://openalex.org/keywords/test-management-approach","display_name":"Test Management Approach","score":0.6472923755645752},{"id":"https://openalex.org/keywords/test","display_name":"Test (biology)","score":0.6288711428642273},{"id":"https://openalex.org/keywords/test-case","display_name":"Test case","score":0.6071956157684326},{"id":"https://openalex.org/keywords/automation","display_name":"Automation","score":0.5834856629371643},{"id":"https://openalex.org/keywords/test-harness","display_name":"Test harness","score":0.5744159817695618},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4122329652309418},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3869548439979553},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.31211626529693604},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.1998494267463684},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.18224963545799255},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.11935418844223022},{"id":"https://openalex.org/keywords/software-development","display_name":"Software development","score":0.0949249267578125}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7991894483566284},{"id":"https://openalex.org/C109086967","wikidata":"https://www.wikidata.org/wiki/Q2509100","display_name":"Test script","level":4,"score":0.7289246916770935},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.6990504264831543},{"id":"https://openalex.org/C160145156","wikidata":"https://www.wikidata.org/wiki/Q778586","display_name":"Executable","level":2,"score":0.6717833280563354},{"id":"https://openalex.org/C7435765","wikidata":"https://www.wikidata.org/wiki/Q7705776","display_name":"Test Management Approach","level":5,"score":0.6472923755645752},{"id":"https://openalex.org/C2777267654","wikidata":"https://www.wikidata.org/wiki/Q3519023","display_name":"Test (biology)","level":2,"score":0.6288711428642273},{"id":"https://openalex.org/C128942645","wikidata":"https://www.wikidata.org/wiki/Q1568346","display_name":"Test case","level":3,"score":0.6071956157684326},{"id":"https://openalex.org/C115901376","wikidata":"https://www.wikidata.org/wiki/Q184199","display_name":"Automation","level":2,"score":0.5834856629371643},{"id":"https://openalex.org/C109852812","wikidata":"https://www.wikidata.org/wiki/Q2406355","display_name":"Test harness","level":5,"score":0.5744159817695618},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4122329652309418},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3869548439979553},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.31211626529693604},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.1998494267463684},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.18224963545799255},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.11935418844223022},{"id":"https://openalex.org/C529173508","wikidata":"https://www.wikidata.org/wiki/Q638608","display_name":"Software development","level":3,"score":0.0949249267578125},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C152877465","wikidata":"https://www.wikidata.org/wiki/Q208042","display_name":"Regression analysis","level":2,"score":0.0},{"id":"https://openalex.org/C186846655","wikidata":"https://www.wikidata.org/wiki/Q3398377","display_name":"Software construction","level":4,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3368089.3417067","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3368089.3417067","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 28th ACM Joint Meeting on European Software Engineering Conference and Symposium on the Foundations of Software Engineering","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","score":0.5199999809265137,"id":"https://metadata.un.org/sdg/9"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W658020064","https://openalex.org/W1498436455","https://openalex.org/W1532325895","https://openalex.org/W1545355820","https://openalex.org/W1598796236","https://openalex.org/W1632114991","https://openalex.org/W1673310716","https://openalex.org/W1736726159","https://openalex.org/W1982488509","https://openalex.org/W1992419399","https://openalex.org/W1996430422","https://openalex.org/W2034627179","https://openalex.org/W2064675550","https://openalex.org/W2087634802","https://openalex.org/W2097998348","https://openalex.org/W2108021205","https://openalex.org/W2113667150","https://openalex.org/W2120636621","https://openalex.org/W2126330798","https://openalex.org/W2131123443","https://openalex.org/W2135239686","https://openalex.org/W2139801247","https://openalex.org/W2144578941","https://openalex.org/W2150593711","https://openalex.org/W2153579005","https://openalex.org/W2241862190","https://openalex.org/W2407776548","https://openalex.org/W2591252546","https://openalex.org/W2888728157","https://openalex.org/W2895351178","https://openalex.org/W2949547296","https://openalex.org/W2963341956","https://openalex.org/W2963403868","https://openalex.org/W3003558015","https://openalex.org/W3143507502","https://openalex.org/W4237602274","https://openalex.org/W4238882151","https://openalex.org/W6674385629"],"related_works":["https://openalex.org/W2949730628","https://openalex.org/W2392299784","https://openalex.org/W3006257721","https://openalex.org/W2109315538","https://openalex.org/W2996721186","https://openalex.org/W2149419207","https://openalex.org/W2161222901","https://openalex.org/W86846735","https://openalex.org/W2243231242","https://openalex.org/W3023720272"],"abstract_inverted_index":{"For":[0],"large":[1,236],"industrial":[2,237],"applications,":[3],"system":[4],"test":[5,28,31,41,46,54,62,68,73,79,84,89,93,96,113,129,138,164,170,181,204,248,290],"cases":[6],"are":[7],"still":[8],"often":[9],"described":[10],"in":[11,115,147,172],"natural":[12,157],"language":[13,158],"(NL),":[14],"and":[15,75,131,217,224,259],"their":[16],"number":[17,256,283,288],"can":[18,98,175,245],"reach":[19],"thousands.":[20],"Test":[21],"automation":[22,32],"is":[23],"to":[24,104,111,135,160,178,199,212,221,293],"automatically":[25],"execute":[26],"the":[27,105,169,179,201,247,255,262,270,287],"cases.":[29,47],"Achieving":[30],"typically":[33],"requires":[34],"substantial":[35],"manual":[36,120,264],"effort":[37,134],"for":[38,71,81,88,141],"creating":[39],"executable":[40],"scripts":[42],"from":[43],"these":[44,83],"NL":[45,53,61,117,163],"In":[48,266],"particular,":[49,267],"given":[50],"that":[51,168,242],"each":[52,72,173],"case":[55],"consists":[56],"of":[57,60,203,231,257,284,289],"a":[58,67,78,152,210,235],"sequence":[59],"steps,":[63],"testers":[64,122],"first":[65],"implement":[66,136],"API":[69,85,107,139,182,291],"method":[70],"step":[74],"then":[76],"write":[77],"script":[80],"invoking":[82],"methods":[86,140,292],"sequentially":[87],"automation.":[90],"Across":[91],"different":[92],"cases,":[94],"multiple":[95],"steps":[97,114,130,165,171,249],"share":[99],"semantic":[100],"similarities,":[101],"supposedly":[102],"mapped":[103,177],"same":[106,180],"method.":[108,183],"However,":[109],"due":[110],"numerous":[112],"various":[116],"forms":[118],"under":[119],"inspection,":[121],"may":[123],"not":[124],"realize":[125],"those":[126],"semantically":[127],"similar":[128,162],"thus":[132,260],"waste":[133],"duplicate":[137],"them.":[142],"To":[143],"address":[144],"this":[145,148],"issue,":[146],"paper,":[149],"we":[150],"propose":[151],"new":[153],"approach":[154,185,207,233,244,274],"based":[155,194],"on":[156,195,234,278],"processing":[159],"cluster":[161,174,246,279],"together":[166],"such":[167],"be":[176,294],"Our":[184,206],"includes":[186,209],"domain-specific":[187],"word":[188],"embedding":[189],"training":[190],"along":[191],"with":[192,250,269],"measurement":[193],"Relaxed":[196],"Word":[197],"Mover\u2019sDistance":[198],"analyze":[200],"similarity":[202],"steps.":[205],"also":[208],"technique":[211],"combine":[213],"hierarchical":[214],"agglomerative":[215],"clustering":[216,219,226],"K-means":[218],"post-refinement":[220],"derive":[222],"high-quality":[223],"manually-adjustable":[225],"results.":[227],"The":[228],"evaluation":[229],"results":[230],"our":[232,243,273],"mobile":[238],"app,":[239],"WeChat,":[240],"show":[241],"high":[251],"accuracy,":[252],"substantially":[253],"reducing":[254,261,281],"clusters":[258],"downstream":[263],"effort.":[265],"compared":[268],"baseline":[271],"approach,":[272],"achieves":[275],"79.8%":[276],"improvement":[277],"quality,":[280],"65.9%":[282],"clusters,":[285],"i.e.,":[286],"implemented.":[295]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":6}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
