{"id":"https://openalex.org/W4294658751","doi":"https://doi.org/10.18293/seke2022-086","title":"Data Selection for Cross-Project Defect Prediction with Local and Global Features of Source Code","display_name":"Data Selection for Cross-Project Defect Prediction with Local and Global Features of Source Code","publication_year":2022,"publication_date":"2022-07-01","ids":{"openalex":"https://openalex.org/W4294658751","doi":"https://doi.org/10.18293/seke2022-086"},"language":"en","primary_location":{"id":"doi:10.18293/seke2022-086","is_oa":true,"landing_page_url":"http://doi.org/10.18293/seke2022-086","pdf_url":"https://doi.org/10.18293/seke2022-086","source":{"id":"https://openalex.org/S4220650826","display_name":"Proceedings/Proceedings of the ... International Conference on Software Engineering and Knowledge Engineering","issn_l":"2325-9000","issn":["2325-9000","2325-9086"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Conferences on Software Engineering and Knowledge Engineering","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://doi.org/10.18293/seke2022-086","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101981890","display_name":"Xuan Deng","orcid":"https://orcid.org/0000-0001-9926-5612"},"institutions":[{"id":"https://openalex.org/I75900474","display_name":"Hubei University","ror":"https://ror.org/03a60m280","country_code":"CN","type":"education","lineage":["https://openalex.org/I75900474"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xuan Deng","raw_affiliation_strings":["Information Engineering Hubei University Wuhan, China","School of Computer Science and"],"affiliations":[{"raw_affiliation_string":"Information Engineering Hubei University Wuhan, China","institution_ids":["https://openalex.org/I75900474"]},{"raw_affiliation_string":"School of Computer Science and","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100459648","display_name":"Peng He","orcid":null},"institutions":[{"id":"https://openalex.org/I75900474","display_name":"Hubei University","ror":"https://ror.org/03a60m280","country_code":"CN","type":"education","lineage":["https://openalex.org/I75900474"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Peng He","raw_affiliation_strings":["Information Engineering Hubei University Wuhan, China","School of Computer Science and"],"affiliations":[{"raw_affiliation_string":"Information Engineering Hubei University Wuhan, China","institution_ids":["https://openalex.org/I75900474"]},{"raw_affiliation_string":"School of Computer Science and","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5108408745","display_name":"Chun Ying Zhou","orcid":null},"institutions":[{"id":"https://openalex.org/I75900474","display_name":"Hubei University","ror":"https://ror.org/03a60m280","country_code":"CN","type":"education","lineage":["https://openalex.org/I75900474"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chun Ying Zhou","raw_affiliation_strings":["School of Computer Science and","Information Engineering Hubei University Wuhan, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and","institution_ids":[]},{"raw_affiliation_string":"Information Engineering Hubei University Wuhan, China","institution_ids":["https://openalex.org/I75900474"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5101981890"],"corresponding_institution_ids":["https://openalex.org/I75900474"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.14902502,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"2022","issue":null,"first_page":"216","last_page":"219"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12423","display_name":"Software Reliability and Analysis Research","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10430","display_name":"Software Engineering Techniques and Practices","score":0.9797000288963318,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8547636866569519},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.6457501649856567},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.6205072999000549},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.5798674821853638},{"id":"https://openalex.org/keywords/measure","display_name":"Measure (data warehouse)","score":0.5473704934120178},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.5438833832740784},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5287373065948486},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.4987764358520508},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.4789605438709259},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.43918848037719727},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.43481796979904175},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.09231698513031006}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8547636866569519},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.6457501649856567},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.6205072999000549},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.5798674821853638},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.5473704934120178},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.5438833832740784},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5287373065948486},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.4987764358520508},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.4789605438709259},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.43918848037719727},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.43481796979904175},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.09231698513031006},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18293/seke2022-086","is_oa":true,"landing_page_url":"http://doi.org/10.18293/seke2022-086","pdf_url":"https://doi.org/10.18293/seke2022-086","source":{"id":"https://openalex.org/S4220650826","display_name":"Proceedings/Proceedings of the ... International Conference on Software Engineering and Knowledge Engineering","issn_l":"2325-9000","issn":["2325-9000","2325-9086"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Conferences on Software Engineering and Knowledge Engineering","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18293/seke2022-086","is_oa":true,"landing_page_url":"http://doi.org/10.18293/seke2022-086","pdf_url":"https://doi.org/10.18293/seke2022-086","source":{"id":"https://openalex.org/S4220650826","display_name":"Proceedings/Proceedings of the ... International Conference on Software Engineering and Knowledge Engineering","issn_l":"2325-9000","issn":["2325-9000","2325-9086"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Conferences on Software Engineering and Knowledge Engineering","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Partnerships for the goals","score":0.41999998688697815,"id":"https://metadata.un.org/sdg/17"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4294658751.pdf","grobid_xml":"https://content.openalex.org/works/W4294658751.grobid-xml"},"referenced_works_count":10,"referenced_works":["https://openalex.org/W2192239100","https://openalex.org/W2666681845","https://openalex.org/W2774451924","https://openalex.org/W2807296583","https://openalex.org/W2888348590","https://openalex.org/W2898435572","https://openalex.org/W2964205113","https://openalex.org/W3139562078","https://openalex.org/W4211259380","https://openalex.org/W4297571622"],"related_works":["https://openalex.org/W2468279273","https://openalex.org/W2354198838","https://openalex.org/W1989130879","https://openalex.org/W2103419012","https://openalex.org/W2988126442","https://openalex.org/W1974414866","https://openalex.org/W2057568687","https://openalex.org/W2063982682","https://openalex.org/W2338543196","https://openalex.org/W3081644756"],"abstract_inverted_index":{"An":[0],"open":[1],"challenge":[2],"for":[3,17,67,75,107,151],"cross-project":[4],"defect":[5,131],"prediction":[6],"(CPDP)":[7],"is":[8,54,61],"how":[9],"to":[10,20,55,85,145],"select":[11],"the":[12,41,47,88,101,104,114,121,135,147,169,176,184],"most":[13],"appropriate":[14],"training":[15,76,148],"data":[16,77,108,149],"target":[18],"project":[19],"build":[21],"quality":[22],"predictor.":[23],"To":[24],"our":[25,162],"knowledge,":[26],"existing":[27],"methods":[28],"are":[29],"mostly":[30],"dominated":[31],"by":[32,118],"traditional":[33,122,170],"hand-crafted":[34],"features,":[35],"which":[36,60],"do":[37],"not":[38],"fully":[39],"encode":[40],"global":[42,92,180],"structure":[43],"between":[44],"codes":[45],"nor":[46],"semantics":[48],"of":[49,63,95,103,116,159,186,192],"code":[50,96,187],"tokens.":[51],"This":[52],"work":[53],"propose":[56,81],"an":[57],"improved":[58],"method":[59,143,163],"capable":[62],"automatically":[64,86],"learning":[65],"features":[66,94,106,182],"representing":[68],"source":[69],"code,":[70],"and":[71,91,153,179],"uses":[72],"these":[73],"feataures":[74],"selection.":[78,109],"First,":[79],"we":[80,99,111],"a":[82,155],"framework":[83],"ALGoF":[84,117,142],"learn":[87],"local":[89,177],"semantic":[90,178],"structural":[93,181],"files.":[97,188],"Then,":[98],"analyze":[100],"feasibility":[102],"learned":[105],"Besides,":[110],"also":[112],"validate":[113],"effectiveness":[115],"comparing":[119],"with":[120],"method.":[123],"The":[124,138,189],"experiments":[125],"have":[126],"been":[127],"conducted":[128],"on":[129],"six":[130],"datasets":[132],"available":[133],"at":[134],"PROMISE":[136],"repository.":[137],"results":[139],"show":[140],"that":[141],"helps":[144],"guide":[146],"selection":[150],"CPDP,":[152],"achieves":[154],"48.31%":[156],"improvement":[157,191],"rate":[158],"F-measure.":[160],"Meanwhile,":[161],"has":[164],"statistically":[165],"significant":[166],"advantages":[167],"over":[168],"method,":[171],"especially":[172],"when":[173],"using":[174],"both":[175],"as":[183],"representation":[185],"maximum":[190],"F-measure":[193],"can":[194],"reach":[195],"42.6%.":[196]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
