{"id":"https://openalex.org/W4404088721","doi":"https://doi.org/10.48550/arxiv.2410.15509","title":"Exploring Curriculum Learning for Vision-Language Tasks: A Study on Small-Scale Multimodal Training","display_name":"Exploring Curriculum Learning for Vision-Language Tasks: A Study on Small-Scale Multimodal Training","publication_year":2024,"publication_date":"2024-10-20","ids":{"openalex":"https://openalex.org/W4404088721","doi":"https://doi.org/10.48550/arxiv.2410.15509"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2410.15509","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2410.15509","pdf_url":"https://arxiv.org/pdf/2410.15509","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2410.15509","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5054410152","display_name":"Rohan Saha","orcid":"https://orcid.org/0000-0001-9747-0057"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Saha, Rohan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5098954215","display_name":"Abrar Fahim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fahim, Abrar","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085831385","display_name":"Alona Fyshe","orcid":"https://orcid.org/0000-0003-4367-0306"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fyshe, Alona","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5087343469","display_name":"A. St. J. Murphy","orcid":"https://orcid.org/0000-0001-8337-4427"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Murphy, Alex","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5054410152"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13071","display_name":"Digital Storytelling and Education","score":0.8871999979019165,"subfield":{"id":"https://openalex.org/subfields/3616","display_name":"Speech and Hearing"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T13071","display_name":"Digital Storytelling and Education","score":0.8871999979019165,"subfield":{"id":"https://openalex.org/subfields/3616","display_name":"Speech and Hearing"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T14516","display_name":"English Language Learning and Teaching","score":0.8366000056266785,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.6703276038169861},{"id":"https://openalex.org/keywords/curriculum","display_name":"Curriculum","score":0.6608314514160156},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.5845173597335815},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5256741642951965},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.4171852171421051},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.3914872705936432},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.35098689794540405},{"id":"https://openalex.org/keywords/pedagogy","display_name":"Pedagogy","score":0.19646039605140686},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.08681279420852661},{"id":"https://openalex.org/keywords/cartography","display_name":"Cartography","score":0.0857362151145935}],"concepts":[{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.6703276038169861},{"id":"https://openalex.org/C47177190","wikidata":"https://www.wikidata.org/wiki/Q207137","display_name":"Curriculum","level":2,"score":0.6608314514160156},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.5845173597335815},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5256741642951965},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.4171852171421051},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.3914872705936432},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.35098689794540405},{"id":"https://openalex.org/C19417346","wikidata":"https://www.wikidata.org/wiki/Q7922","display_name":"Pedagogy","level":1,"score":0.19646039605140686},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.08681279420852661},{"id":"https://openalex.org/C58640448","wikidata":"https://www.wikidata.org/wiki/Q42515","display_name":"Cartography","level":1,"score":0.0857362151145935},{"id":"https://openalex.org/C153294291","wikidata":"https://www.wikidata.org/wiki/Q25261","display_name":"Meteorology","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2410.15509","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2410.15509","pdf_url":"https://arxiv.org/pdf/2410.15509","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2410.15509","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2410.15509","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2410.15509","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2410.15509","pdf_url":"https://arxiv.org/pdf/2410.15509","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4404088721.pdf","grobid_xml":"https://content.openalex.org/works/W4404088721.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W230091440","https://openalex.org/W2233261550","https://openalex.org/W2810751659","https://openalex.org/W258997015","https://openalex.org/W2997094352","https://openalex.org/W3216976533","https://openalex.org/W100620283","https://openalex.org/W2495260952","https://openalex.org/W4366179611","https://openalex.org/W2996078371"],"abstract_inverted_index":{"For":[0],"specialized":[1],"domains,":[2],"there":[3],"is":[4],"often":[5],"not":[6],"a":[7,39,50,93,109],"wealth":[8],"of":[9,58,89,104,115,119,146],"data":[10,22,46,111],"with":[11,33,182],"which":[12],"to":[13,30,49,64,84,179,199],"train":[14],"large":[15],"machine":[16,79],"learning":[17,67,73,80,160,166,177],"models.":[18],"In":[19],"such":[20,35,204],"limited":[21,110],"/":[23,61],"compute":[24],"settings,":[25],"various":[26],"methods":[27],"exist":[28],"aiming":[29],"$\\textit{do":[31],"more":[32],"less}$,":[34],"as":[36,45,113,198],"finetuning":[37],"from":[38,71],"pretrained":[40],"model,":[41],"modulating":[42],"difficulty":[43],"levels":[44],"are":[47],"presented":[48],"model":[51,59,134],"(curriculum":[52],"learning),":[53],"and":[54,140,151,195],"considering":[55,75],"the":[56,86,102,116,120],"role":[57,103],"type":[60],"size.":[62],"Approaches":[63],"efficient":[65],"$\\textit{machine}$":[66],"also":[68],"take":[69],"inspiration":[70],"$\\textit{human}$":[72],"by":[74,92],"use":[76],"cases":[77],"where":[78],"systems":[81],"have":[82],"access":[83],"approximately":[85],"same":[87],"number":[88],"words":[90],"experienced":[91],"13":[94],"year":[95],"old":[96],"child":[97],"(100M":[98],"words).":[99],"We":[100,123,136,156,187],"investigate":[101],"3":[105],"primary":[106],"variables":[107,139],"in":[108],"regime":[112],"part":[114],"multimodal":[117,149,162],"track":[118],"BabyLM":[121],"challenge.":[122],"contrast:":[124],"(i)":[125],"curriculum":[126,159,176],"learning,":[127],"(ii),":[128],"pretraining":[129],"(with":[130],"text-only":[131,171,174],"data),":[132],"(iii)":[133],"type.":[135],"modulate":[137],"these":[138],"assess":[141],"them":[142],"on":[143,192],"two":[144],"types":[145],"tasks:":[147],"(a)":[148],"(text+image),":[150],"(b)":[152],"unimodal":[153],"(text-only)":[154],"tasks.":[155],"find":[157],"that":[158],"benefits":[161],"evaluations":[163],"over":[164],"non-curriclum":[165],"models,":[167],"particularly":[168],"when":[169],"combining":[170],"pretraining.":[172],"On":[173],"tasks,":[175],"appears":[178],"help":[180],"models":[181],"smaller":[183],"trainable":[184],"parameter":[185],"counts.":[186],"suggest":[188],"possible":[189],"reasons":[190],"based":[191],"architectural":[193],"differences":[194],"training":[196],"designs":[197],"why":[200],"one":[201],"might":[202],"observe":[203],"results.":[205]},"counts_by_year":[],"updated_date":"2026-03-10T16:38:18.471706","created_date":"2025-10-10T00:00:00"}
