{"id":"https://openalex.org/W4404987633","doi":"https://doi.org/10.48550/arxiv.2411.15004","title":"ScribeAgent: Towards Specialized Web Agents Using Production-Scale Workflow Data","display_name":"ScribeAgent: Towards Specialized Web Agents Using Production-Scale Workflow Data","publication_year":2024,"publication_date":"2024-11-22","ids":{"openalex":"https://openalex.org/W4404987633","doi":"https://doi.org/10.48550/arxiv.2411.15004"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2411.15004","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2411.15004","pdf_url":"https://arxiv.org/pdf/2411.15004","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2411.15004","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5036843433","display_name":"Jun-Hong Shen","orcid":"https://orcid.org/0000-0002-6220-096X"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Shen, Junhong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100879246","display_name":"Atishay Jain","orcid":"https://orcid.org/0009-0004-6868-3490"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jain, Atishay","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029281644","display_name":"Zhiguang Xiao","orcid":"https://orcid.org/0000-0001-6908-8897"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiao, Zedian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114987867","display_name":"Ishan Amlekar","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Amlekar, Ishan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114987868","display_name":"Mouad Hadji","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hadji, Mouad","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114987869","display_name":"Aaron Podolny","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Podolny, Aaron","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5029768722","display_name":"Ameet Talwalkar","orcid":"https://orcid.org/0000-0001-6650-1893"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Talwalkar, Ameet","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5036843433"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9876999855041504,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9876999855041504,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10703","display_name":"Business Process Modeling and Analysis","score":0.9663000106811523,"subfield":{"id":"https://openalex.org/subfields/1404","display_name":"Management Information Systems"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10456","display_name":"Multi-Agent Systems and Negotiation","score":0.9419999718666077,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.8184124231338501},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.6230384707450867},{"id":"https://openalex.org/keywords/production","display_name":"Production (economics)","score":0.6011964678764343},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5377566814422607},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.4784453213214874},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.3649742603302002},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.08652585744857788},{"id":"https://openalex.org/keywords/cartography","display_name":"Cartography","score":0.05686727166175842},{"id":"https://openalex.org/keywords/economics","display_name":"Economics","score":0.05236083269119263}],"concepts":[{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.8184124231338501},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.6230384707450867},{"id":"https://openalex.org/C2778348673","wikidata":"https://www.wikidata.org/wiki/Q739302","display_name":"Production (economics)","level":2,"score":0.6011964678764343},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5377566814422607},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.4784453213214874},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.3649742603302002},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.08652585744857788},{"id":"https://openalex.org/C58640448","wikidata":"https://www.wikidata.org/wiki/Q42515","display_name":"Cartography","level":1,"score":0.05686727166175842},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.05236083269119263},{"id":"https://openalex.org/C139719470","wikidata":"https://www.wikidata.org/wiki/Q39680","display_name":"Macroeconomics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2411.15004","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2411.15004","pdf_url":"https://arxiv.org/pdf/2411.15004","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2411.15004","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2411.15004","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2411.15004","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2411.15004","pdf_url":"https://arxiv.org/pdf/2411.15004","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4404987633.pdf","grobid_xml":"https://content.openalex.org/works/W4404987633.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W1981780420","https://openalex.org/W2182707996","https://openalex.org/W45233828","https://openalex.org/W2964988449","https://openalex.org/W2397952901","https://openalex.org/W2029380707","https://openalex.org/W188202134","https://openalex.org/W4255934811","https://openalex.org/W2394416426"],"abstract_inverted_index":{"Large":[0],"Language":[1],"Model":[2],"(LLM)":[3],"agents":[4,17,91,118],"are":[5,39],"rapidly":[6],"improving":[7],"to":[8,31,43,77],"handle":[9],"increasingly":[10],"complex":[11],"web-based":[12],"tasks.":[13],"Most":[14],"of":[15,145],"these":[16],"rely":[18],"on":[19,27,92,102,119,127],"general-purpose,":[20],"proprietary":[21],"models":[22],"like":[23],"GPT-4":[24],"and":[25,51,104,132,143],"focus":[26],"designing":[28],"better":[29],"prompts":[30],"improve":[32],"their":[33],"planning":[34],"abilities.":[35],"However,":[36],"general-purpose":[37],"LLMs":[38,66],"not":[40],"specifically":[41],"trained":[42],"understand":[44],"specialized":[45],"web":[46,117],"contexts":[47],"such":[48],"as":[49],"HTML,":[50],"they":[52],"often":[53],"struggle":[54],"with":[55],"long-horizon":[56],"planning.":[57],"We":[58,121],"explore":[59],"an":[60],"alternative":[61],"approach":[62,85],"that":[63],"fine-tunes":[64],"open-source":[65],"using":[67],"production-scale":[68],"workflow":[69],"data":[70],"collected":[71],"from":[72],"over":[73,89,112],"250":[74],"domains":[75],"corresponding":[76],"6":[78],"billion":[79],"tokens.":[80],"This":[81],"simple":[82],"yet":[83],"effective":[84],"shows":[86],"substantial":[87],"gains":[88],"prompting-based":[90],"existing":[93],"benchmarks":[94],"--":[95],"ScribeAgent":[96],"achieves":[97],"state-of-the-art":[98],"direct":[99],"generation":[100],"performance":[101],"Mind2Web":[103],"improves":[105],"the":[106,113],"task":[107],"success":[108],"rate":[109],"by":[110],"7.3%":[111],"previous":[114],"best":[115],"text-only":[116],"WebArena.":[120],"further":[122],"perform":[123],"detailed":[124],"ablation":[125],"studies":[126],"various":[128],"fine-tuning":[129],"design":[130],"choices":[131],"provide":[133],"insights":[134],"into":[135],"LLM":[136],"selection,":[137],"training":[138],"recipes,":[139],"context":[140],"window":[141],"optimization,":[142],"effect":[144],"dataset":[146],"sizes.":[147]},"counts_by_year":[],"updated_date":"2026-03-09T08:58:05.943551","created_date":"2024-12-04T00:00:00"}
