{"id":"https://openalex.org/W7124951320","doi":"https://doi.org/10.1109/aiware69974.2025.00011","title":"Understanding LLM-Driven Test Oracle Generation","display_name":"Understanding LLM-Driven Test Oracle Generation","publication_year":2025,"publication_date":"2025-11-19","ids":{"openalex":"https://openalex.org/W7124951320","doi":"https://doi.org/10.1109/aiware69974.2025.00011"},"language":null,"primary_location":{"id":"doi:10.1109/aiware69974.2025.00011","is_oa":false,"landing_page_url":"https://doi.org/10.1109/aiware69974.2025.00011","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 2nd IEEE/ACM International Conference on AI-powered Software (AIware)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5123427227","display_name":"Adam Bodicoat","orcid":null},"institutions":[{"id":"https://openalex.org/I154130895","display_name":"University of Auckland","ror":"https://ror.org/03b94tp07","country_code":"NZ","type":"education","lineage":["https://openalex.org/I154130895"]}],"countries":["NZ"],"is_corresponding":true,"raw_author_name":"Adam Bodicoat","raw_affiliation_strings":["University of Auckland,Auckland,New Zealand"],"affiliations":[{"raw_affiliation_string":"University of Auckland,Auckland,New Zealand","institution_ids":["https://openalex.org/I154130895"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085228874","display_name":"Gunel Jahangirova","orcid":"https://orcid.org/0000-0002-1423-1083"},"institutions":[{"id":"https://openalex.org/I183935753","display_name":"King's College London","ror":"https://ror.org/0220mzb33","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I183935753"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Gunel Jahangirova","raw_affiliation_strings":["King&#x0027;s College London,London,United Kingdom"],"affiliations":[{"raw_affiliation_string":"King&#x0027;s College London,London,United Kingdom","institution_ids":["https://openalex.org/I183935753"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5123399727","display_name":"Valerio Terragni","orcid":null},"institutions":[{"id":"https://openalex.org/I154130895","display_name":"University of Auckland","ror":"https://ror.org/03b94tp07","country_code":"NZ","type":"education","lineage":["https://openalex.org/I154130895"]}],"countries":["NZ"],"is_corresponding":false,"raw_author_name":"Valerio Terragni","raw_affiliation_strings":["University of Auckland,Auckland,New Zealand"],"affiliations":[{"raw_affiliation_string":"University of Auckland,Auckland,New Zealand","institution_ids":["https://openalex.org/I154130895"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5123427227"],"corresponding_institution_ids":["https://openalex.org/I154130895"],"apc_list":null,"apc_paid":null,"fwci":2.2675,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.91554192,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"29","last_page":"39"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.9609000086784363,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.9609000086784363,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.008500000461935997,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.007699999958276749,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/oracle","display_name":"Oracle","score":0.7832000255584717},{"id":"https://openalex.org/keywords/regression-testing","display_name":"Regression testing","score":0.5418999791145325},{"id":"https://openalex.org/keywords/unit-testing","display_name":"Unit testing","score":0.5375999808311462},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.4431999921798706},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.41819998621940613},{"id":"https://openalex.org/keywords/software-quality","display_name":"Software quality","score":0.4178999960422516},{"id":"https://openalex.org/keywords/predicate","display_name":"Predicate (mathematical logic)","score":0.4074000120162964},{"id":"https://openalex.org/keywords/test","display_name":"Test (biology)","score":0.38089999556541443}],"concepts":[{"id":"https://openalex.org/C55166926","wikidata":"https://www.wikidata.org/wiki/Q2892946","display_name":"Oracle","level":2,"score":0.7832000255584717},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6822999715805054},{"id":"https://openalex.org/C161821725","wikidata":"https://www.wikidata.org/wiki/Q917415","display_name":"Regression testing","level":5,"score":0.5418999791145325},{"id":"https://openalex.org/C148027188","wikidata":"https://www.wikidata.org/wiki/Q907375","display_name":"Unit testing","level":3,"score":0.5375999808311462},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.5105000138282776},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.4431999921798706},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.41819998621940613},{"id":"https://openalex.org/C117447612","wikidata":"https://www.wikidata.org/wiki/Q1412670","display_name":"Software quality","level":4,"score":0.4178999960422516},{"id":"https://openalex.org/C140146324","wikidata":"https://www.wikidata.org/wiki/Q1144319","display_name":"Predicate (mathematical logic)","level":2,"score":0.4074000120162964},{"id":"https://openalex.org/C2777267654","wikidata":"https://www.wikidata.org/wiki/Q3519023","display_name":"Test (biology)","level":2,"score":0.38089999556541443},{"id":"https://openalex.org/C128942645","wikidata":"https://www.wikidata.org/wiki/Q1568346","display_name":"Test case","level":3,"score":0.37059998512268066},{"id":"https://openalex.org/C120936955","wikidata":"https://www.wikidata.org/wiki/Q2155640","display_name":"Empirical research","level":2,"score":0.36719998717308044},{"id":"https://openalex.org/C2984328558","wikidata":"https://www.wikidata.org/wiki/Q188522","display_name":"Software testing","level":3,"score":0.35989999771118164},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.33500000834465027},{"id":"https://openalex.org/C529173508","wikidata":"https://www.wikidata.org/wiki/Q638608","display_name":"Software development","level":3,"score":0.3165000081062317},{"id":"https://openalex.org/C2994232186","wikidata":"https://www.wikidata.org/wiki/Q50324608","display_name":"World class","level":2,"score":0.27649998664855957},{"id":"https://openalex.org/C162443782","wikidata":"https://www.wikidata.org/wiki/Q1066228","display_name":"White-box testing","level":5,"score":0.26989999413490295},{"id":"https://openalex.org/C164691408","wikidata":"https://www.wikidata.org/wiki/Q5071844","display_name":"Change impact analysis","level":3,"score":0.2694000005722046},{"id":"https://openalex.org/C188598960","wikidata":"https://www.wikidata.org/wiki/Q7705805","display_name":"Test strategy","level":3,"score":0.2671000063419342},{"id":"https://openalex.org/C7435765","wikidata":"https://www.wikidata.org/wiki/Q7705776","display_name":"Test Management Approach","level":5,"score":0.2669999897480011},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.25440001487731934}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/aiware69974.2025.00011","is_oa":false,"landing_page_url":"https://doi.org/10.1109/aiware69974.2025.00011","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 2nd IEEE/ACM International Conference on AI-powered Software (AIware)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":34,"referenced_works":["https://openalex.org/W1965194038","https://openalex.org/W1971650562","https://openalex.org/W2041713059","https://openalex.org/W2122205205","https://openalex.org/W2156723666","https://openalex.org/W2167271913","https://openalex.org/W2888080919","https://openalex.org/W3005628256","https://openalex.org/W3086938529","https://openalex.org/W3098391866","https://openalex.org/W4284681867","https://openalex.org/W4284690374","https://openalex.org/W4296394699","https://openalex.org/W4384155677","https://openalex.org/W4385301323","https://openalex.org/W4385473722","https://openalex.org/W4389104713","https://openalex.org/W4391974543","https://openalex.org/W4400484796","https://openalex.org/W4400582872","https://openalex.org/W4400978763","https://openalex.org/W4401906817","https://openalex.org/W4403186335","https://openalex.org/W4403536268","https://openalex.org/W4403538008","https://openalex.org/W4404783393","https://openalex.org/W4405441291","https://openalex.org/W4406798194","https://openalex.org/W4406867742","https://openalex.org/W4409495141","https://openalex.org/W4410537837","https://openalex.org/W4411449794","https://openalex.org/W4415746277","https://openalex.org/W4415746319"],"related_works":[],"abstract_inverted_index":{"Automated":[0],"unit":[1],"test":[2,73,109],"generation":[3,144],"aims":[4],"to":[5,71],"improve":[6],"software":[7,87,113],"quality":[8,128],"while":[9],"reducing":[10],"the":[11,30,34,42,45,55,103,127,137,146],"time":[12],"and":[13,89,121,139,155],"effort":[14],"required":[15],"for":[16],"creating":[17],"tests":[18],"manually.":[19],"However,":[20],"existing":[21],"techniques":[22],"primarily":[23],"generate":[24,72],"regression":[25],"oracles":[26,74,110],"that":[27,75,111],"predicate":[28],"on":[29,102],"implemented":[31],"behavior":[32],"of":[33,47,57,84,105,123,129,141,152],"class":[35],"under":[36],"test.":[37],"They":[38],"do":[39],"not":[40],"address":[41],"oracle":[43,143],"problem:":[44],"challenge":[46],"distinguishing":[48],"correct":[49],"from":[50],"incorrect":[51],"program":[52],"behavior.":[53,78],"With":[54],"rise":[56],"Foundation":[58],"Models":[59,64],"(FMs),":[60],"particularly":[61],"Large":[62],"Language":[63],"(LLMs),":[65],"there":[66],"is":[67],"a":[68],"new":[69],"opportunity":[70],"reflect":[76],"intended":[77],"This":[79,96],"positions":[80],"LLMs":[81,106],"as":[82],"enablers":[83],"Promptware,":[85],"where":[86],"creation":[88],"testing":[90],"are":[91],"driven":[92],"by":[93],"natural-language":[94],"prompts.":[95],"paper":[97],"presents":[98],"an":[99],"empirical":[100],"study":[101],"effectiveness":[104],"in":[107,145,159],"generating":[108],"expose":[112],"failures.":[114],"We":[115],"investigate":[116],"how":[117],"different":[118],"prompting":[119],"strategies":[120],"levels":[122],"contextual":[124],"input":[125],"impact":[126],"LLM-generated":[130],"oracles.":[131],"Our":[132],"findings":[133],"offer":[134],"insights":[135],"into":[136],"strengths":[138],"limitations":[140],"LLM-based":[142],"FM":[147],"era,":[148],"improving":[149],"our":[150],"understanding":[151],"their":[153],"capabilities":[154],"fostering":[156],"future":[157],"research":[158],"this":[160],"area.":[161]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-04-02T15:55:50.835912","created_date":"2026-01-21T00:00:00"}
