{"id":"https://openalex.org/W7125124111","doi":"https://doi.org/10.48550/arxiv.2601.11647","title":"Reinforcement Learning for Dynamic Workflow Optimization in CI/CD Pipelines","display_name":"Reinforcement Learning for Dynamic Workflow Optimization in CI/CD Pipelines","publication_year":2026,"publication_date":"2026-01-15","ids":{"openalex":"https://openalex.org/W7125124111","doi":"https://doi.org/10.48550/arxiv.2601.11647"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2601.11647","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.11647","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2601.11647","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5040634542","display_name":"Arun Soni","orcid":"https://orcid.org/0000-0001-8593-3229"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Soni, Aniket Abhishek","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123528531","display_name":"Milan Parikh","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Parikh, Milan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5117774578","display_name":"Rashi Nimesh Kumar Dhenia","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dhenia, Rashi Nimesh Kumar","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123534869","display_name":"Jubin Abhishek Soni","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Soni, Jubin Abhishek","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123473935","display_name":"Ayush Raj Jha","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jha, Ayush Raj","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5123489547","display_name":"Sneja Mitinbhai Shah","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shah, Sneja Mitinbhai","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5040634542"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.29679998755455017,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.29679998755455017,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.20730000734329224,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10639","display_name":"Advanced Software Engineering Methodologies","score":0.06790000200271606,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8669000267982483},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.7840999960899353},{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.6796000003814697},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.6514000296592712},{"id":"https://openalex.org/keywords/devops","display_name":"DevOps","score":0.6035000085830688},{"id":"https://openalex.org/keywords/throughput","display_name":"Throughput","score":0.5652999877929688},{"id":"https://openalex.org/keywords/pipeline-transport","display_name":"Pipeline transport","score":0.5651999711990356},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.4948999881744385}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8669000267982483},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.7840999960899353},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7242000102996826},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.6796000003814697},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.6514000296592712},{"id":"https://openalex.org/C9903902","wikidata":"https://www.wikidata.org/wiki/Q3025536","display_name":"DevOps","level":3,"score":0.6035000085830688},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.5652999877929688},{"id":"https://openalex.org/C175309249","wikidata":"https://www.wikidata.org/wiki/Q725864","display_name":"Pipeline transport","level":2,"score":0.5651999711990356},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.4948999881744385},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.46059998869895935},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.37380000948905945},{"id":"https://openalex.org/C128942645","wikidata":"https://www.wikidata.org/wiki/Q1568346","display_name":"Test case","level":3,"score":0.36970001459121704},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.35760000348091125},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.34290000796318054},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.30959999561309814},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.30300000309944153},{"id":"https://openalex.org/C80519477","wikidata":"https://www.wikidata.org/wiki/Q3532236","display_name":"Scenario testing","level":3,"score":0.29420000314712524},{"id":"https://openalex.org/C188116033","wikidata":"https://www.wikidata.org/wiki/Q2664563","display_name":"Q-learning","level":3,"score":0.28929999470710754},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2806999981403351},{"id":"https://openalex.org/C98763669","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov chain","level":2,"score":0.27399998903274536},{"id":"https://openalex.org/C2778820799","wikidata":"https://www.wikidata.org/wiki/Q3454688","display_name":"Cost reduction","level":2,"score":0.2583000063896179},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.25200000405311584}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2601.11647","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.11647","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2601.11647","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.11647","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Responsible consumption and production","score":0.4359267055988312,"id":"https://metadata.un.org/sdg/12"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Continuous":[0,3],"Integration":[1],"and":[2,47,89,109,164,176],"Deployment":[4],"(CI/CD)":[5],"pipelines":[6],"are":[7],"central":[8],"to":[9,32,53,68,82,102,120,135,161],"modern":[10],"software":[11],"delivery,":[12],"yet":[13],"their":[14],"static":[15,121],"workflows":[16],"often":[17],"introduce":[18],"inefficiencies":[19],"as":[20,42,58],"systems":[21],"scale.":[22],"This":[23],"paper":[24],"proposes":[25],"a":[26,43,103,111,125,169],"reinforcement":[27,159],"learning":[28,160],"(RL)":[29],"based":[30],"approach":[31,85],"dynamically":[33],"optimize":[34],"CI/CD":[35,77,178],"pipeline":[36,39,99],"workflows.":[37],"The":[38,132],"is":[40,51,80],"modeled":[41],"Markov":[44],"Decision":[45],"Process,":[46],"an":[48],"RL":[49,97],"agent":[50,133],"trained":[52],"make":[54],"runtime":[55],"decisions":[56],"such":[57],"selecting":[59],"full,":[60],"partial,":[61],"or":[62,138],"no":[63],"test":[64,116],"execution":[65,117],"in":[66,107,115],"order":[67],"maximize":[69],"throughput":[70,108],"while":[71,123],"minimizing":[72],"testing":[73],"overhead.":[74],"A":[75],"configurable":[76],"simulation":[78],"environment":[79],"developed":[81],"evaluate":[83],"the":[84,96,156],"across":[86],"build,":[87],"test,":[88],"deploy":[90],"stages.":[91],"Experimental":[92],"results":[93,154],"show":[94],"that":[95],"optimized":[98],"achieves":[100],"up":[101],"30":[104],"percent":[105,113],"improvement":[106],"approximately":[110],"25":[112],"reduction":[114],"time":[118],"compared":[119],"baselines,":[122],"maintaining":[124],"defect":[126],"miss":[127],"rate":[128],"below":[129],"5":[130],"percent.":[131],"learns":[134],"selectively":[136],"skip":[137],"abbreviate":[139],"tests":[140],"for":[141],"low":[142],"risk":[143],"commits,":[144],"accelerating":[145],"feedback":[146],"cycles":[147],"without":[148],"significantly":[149],"increasing":[150],"failure":[151],"risk.":[152],"These":[153],"demonstrate":[155],"potential":[157],"of":[158],"enable":[162],"adaptive":[163],"intelligent":[165],"DevOps":[166],"workflows,":[167],"providing":[168],"practical":[170],"pathway":[171],"toward":[172],"more":[173],"efficient,":[174],"resilient,":[175],"sustainable":[177],"automation.":[179]},"counts_by_year":[],"updated_date":"2026-01-22T23:33:04.759266","created_date":"2026-01-22T00:00:00"}
