{"id":"https://openalex.org/W4411960814","doi":"https://doi.org/10.1007/s10270-025-01305-1","title":"Repeat, reorder, rephrase: data augmentation for process information extraction","display_name":"Repeat, reorder, rephrase: data augmentation for process information extraction","publication_year":2025,"publication_date":"2025-07-02","ids":{"openalex":"https://openalex.org/W4411960814","doi":"https://doi.org/10.1007/s10270-025-01305-1"},"language":"en","primary_location":{"id":"doi:10.1007/s10270-025-01305-1","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10270-025-01305-1","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10270-025-01305-1.pdf","source":{"id":"https://openalex.org/S64245694","display_name":"Software & Systems Modeling","issn_l":"1619-1366","issn":["1619-1366","1619-1374"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Software and Systems Modeling","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s10270-025-01305-1.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5016710529","display_name":"Julian Neuberger","orcid":"https://orcid.org/0009-0008-4244-7659"},"institutions":[{"id":"https://openalex.org/I54009628","display_name":"University of Bayreuth","ror":"https://ror.org/0234wmv40","country_code":"DE","type":"education","lineage":["https://openalex.org/I54009628"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Julian Neuberger","raw_affiliation_strings":["University of Bayreuth, Universit\u00e4tsstra\u00dfe 30, Bayreuth, Germany"],"raw_orcid":"https://orcid.org/0009-0008-4244-7659","affiliations":[{"raw_affiliation_string":"University of Bayreuth, Universit\u00e4tsstra\u00dfe 30, Bayreuth, Germany","institution_ids":["https://openalex.org/I54009628"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074762375","display_name":"Lars Ackermann","orcid":"https://orcid.org/0000-0002-6785-8998"},"institutions":[{"id":"https://openalex.org/I4210138088","display_name":"Hof University of Applied Sciences","ror":"https://ror.org/04q5vv384","country_code":"DE","type":"education","lineage":["https://openalex.org/I4210138088"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Lars Ackermann","raw_affiliation_strings":["Hof University of Applied Sciences, Alfons-Goppel-Platz 1, Hof, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Hof University of Applied Sciences, Alfons-Goppel-Platz 1, Hof, Germany","institution_ids":["https://openalex.org/I4210138088"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5110717736","display_name":"Stefan Jablonski","orcid":null},"institutions":[{"id":"https://openalex.org/I54009628","display_name":"University of Bayreuth","ror":"https://ror.org/0234wmv40","country_code":"DE","type":"education","lineage":["https://openalex.org/I54009628"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Stefan Jablonski","raw_affiliation_strings":["University of Bayreuth, Universit\u00e4tsstra\u00dfe 30, Bayreuth, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Bayreuth, Universit\u00e4tsstra\u00dfe 30, Bayreuth, Germany","institution_ids":["https://openalex.org/I54009628"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5016710529"],"corresponding_institution_ids":["https://openalex.org/I54009628"],"apc_list":{"value":2290,"currency":"EUR","value_usd":2890},"apc_paid":{"value":2290,"currency":"EUR","value_usd":2890},"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.26403634,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"25","issue":"2","first_page":"329","last_page":"350"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10703","display_name":"Business Process Modeling and Analysis","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/1404","display_name":"Management Information Systems"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10703","display_name":"Business Process Modeling and Analysis","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/1404","display_name":"Management Information Systems"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9909999966621399,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9865000247955322,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5665071606636047},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5374809503555298},{"id":"https://openalex.org/keywords/data-extraction","display_name":"Data extraction","score":0.4977422058582306},{"id":"https://openalex.org/keywords/extraction","display_name":"Extraction (chemistry)","score":0.42788925766944885},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.33046215772628784},{"id":"https://openalex.org/keywords/medline","display_name":"MEDLINE","score":0.1543915569782257},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.10416248440742493},{"id":"https://openalex.org/keywords/political-science","display_name":"Political science","score":0.09844914078712463},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.07734397053718567},{"id":"https://openalex.org/keywords/chromatography","display_name":"Chromatography","score":0.05325084924697876}],"concepts":[{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5665071606636047},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5374809503555298},{"id":"https://openalex.org/C2777466982","wikidata":"https://www.wikidata.org/wiki/Q5227287","display_name":"Data extraction","level":3,"score":0.4977422058582306},{"id":"https://openalex.org/C4725764","wikidata":"https://www.wikidata.org/wiki/Q844704","display_name":"Extraction (chemistry)","level":2,"score":0.42788925766944885},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.33046215772628784},{"id":"https://openalex.org/C2779473830","wikidata":"https://www.wikidata.org/wiki/Q1540899","display_name":"MEDLINE","level":2,"score":0.1543915569782257},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.10416248440742493},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.09844914078712463},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.07734397053718567},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.05325084924697876},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1007/s10270-025-01305-1","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10270-025-01305-1","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10270-025-01305-1.pdf","source":{"id":"https://openalex.org/S64245694","display_name":"Software & Systems Modeling","issn_l":"1619-1366","issn":["1619-1366","1619-1374"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Software and Systems Modeling","raw_type":"journal-article"},{"id":"pmh:doi:10.15495/epub_ubt_00008922","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"}],"best_oa_location":{"id":"doi:10.1007/s10270-025-01305-1","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10270-025-01305-1","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10270-025-01305-1.pdf","source":{"id":"https://openalex.org/S64245694","display_name":"Software & Systems Modeling","issn_l":"1619-1366","issn":["1619-1366","1619-1374"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Software and Systems Modeling","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F5728949745","display_name":"Universit\u00e4t Bayreuth","ror":"https://ror.org/0234wmv40"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4411960814.pdf","grobid_xml":"https://content.openalex.org/works/W4411960814.grobid-xml"},"referenced_works_count":34,"referenced_works":["https://openalex.org/W207431025","https://openalex.org/W1981276685","https://openalex.org/W2081580037","https://openalex.org/W2118714763","https://openalex.org/W2539781702","https://openalex.org/W2617290256","https://openalex.org/W2947164866","https://openalex.org/W2949676527","https://openalex.org/W2952179106","https://openalex.org/W2954996726","https://openalex.org/W3021503072","https://openalex.org/W3083217792","https://openalex.org/W3096986424","https://openalex.org/W3166194309","https://openalex.org/W3173975877","https://openalex.org/W3175864158","https://openalex.org/W3211708814","https://openalex.org/W4246726178","https://openalex.org/W4291127651","https://openalex.org/W4312911974","https://openalex.org/W4319877694","https://openalex.org/W4323903886","https://openalex.org/W4379659873","https://openalex.org/W4379798775","https://openalex.org/W4386321037","https://openalex.org/W4387904842","https://openalex.org/W4390694561","https://openalex.org/W4392781032","https://openalex.org/W4396713940","https://openalex.org/W4399195425","https://openalex.org/W4401023707","https://openalex.org/W4403793823","https://openalex.org/W4405579999","https://openalex.org/W6702248584"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"Abstract":[0],"Automatic":[1],"retrieval":[2,36],"of":[3,28,44,77,85,112,130,141,148,162,182,211],"formal":[4],"business":[5,78],"process":[6,79,149,171],"models":[7],"from":[8,158,224],"their":[9],"natural":[10,163],"language":[11,63,164],"descriptions":[12],"is":[13,38,71,93,100],"a":[14,26,128],"well-established":[15],"way":[16],"to":[17,88,106,170],"facilitate":[18],"the":[19,75,94,139,146,159,176,201],"time-":[20],"and":[21,33,110,174,186,226,248],"cost-intensive":[22],"modeling":[23],"procedure.":[24],"Yet,":[25],"lack":[27],"data":[29,131,143,155,178,193],"usable":[30],"for":[31,138,220,235,250],"developing":[32],"training":[34],"new":[35],"methods":[37,54],"impeding":[39],"progress":[40],"in":[41,74,119,145,180,196,200],"this":[42,124],"field":[43,161],"research.":[45],"This":[46],"issue":[47],"can":[48],"be":[49,89],"overcome":[50],"by":[51,115],"either":[52],"using":[53],"less":[55],"reliant":[56],"on":[57],"high-quality":[58],"data,":[59],"such":[60],"as":[61],"large":[62],"models,":[64],"or":[65],"creating":[66],"bigger":[67],"datasets.":[68],"The":[69],"latter":[70],"often":[72,167],"preferable":[73],"context":[76,147],"modeling,":[80],"especially":[81],"when":[82],"internal":[83],"workflows":[84],"organizations":[86],"have":[87],"treated":[90],"confidentially.":[91],"It":[92],"more":[95],"data-intensive":[96],"solution,":[97],"though,":[98],"which":[99,134],"costly.":[101],"Data":[102],"augmentation":[103,132,156,194],"techniques":[104,157],"aim":[105],"improve":[107],"both":[108],"quality":[109,144],"quantity":[111],"existing":[113],"datasets,":[114],"deliberate":[116],"perturbations":[117],"resulting":[118,177],"new,":[120],"synthetic":[121],"data.":[122],"In":[123,190],"article,":[125],"we":[126],"present":[127],"collection":[129],"techniques,":[133],"are":[135,166],"specifically":[136],"selected":[137],"task":[140],"improving":[142],"information":[150,172],"extraction.":[151],"We":[152,241],"show":[153],"why":[154],"wider":[160],"processing":[165],"not":[168],"applicable":[169],"extraction,":[173],"how":[175],"differ":[179],"terms":[181],"linguistic":[183],"variety,":[184],"structure,":[185],"feature":[187],"space":[188],"coverage.":[189],"our":[191,251],"experiments,":[192],"results":[195,249],"an":[197],"absolute":[198],"improvement":[199],"$$F_1$$":[202],"<mml:math":[203,213,228],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\">":[204,214,229],"<mml:msub>":[205],"<mml:mi>F</mml:mi>":[206],"<mml:mn>1</mml:mn>":[207],"</mml:msub>":[208],"</mml:math>":[209,219,234],"measure":[210],"$$5.7\\%$$":[212],"<mml:mrow>":[215,230],"<mml:mn>5.7</mml:mn>":[216],"<mml:mo>%</mml:mo>":[217,232],"</mml:mrow>":[218,233],"extracting":[221,236],"process-relevant":[222],"entities":[223],"text":[225],"$$4.5\\%$$":[227],"<mml:mn>4.5</mml:mn>":[231],"relations":[237],"between":[238],"those":[239],"entities.":[240],"make":[242],"all":[243],"code":[244],"available":[245],"at":[246,253],"https://github.com/JulianNeuberger/pet-data-augmentation":[247],"experiments":[252],"https://zenodo.org/doi/10.5281/zenodo.10941423":[254],".":[255]},"counts_by_year":[],"updated_date":"2026-03-18T06:27:02.140700","created_date":"2025-10-10T00:00:00"}
