{"id":"https://openalex.org/W6893003303","doi":"https://doi.org/10.5281/zenodo.13362647","title":"Recursiveness in Multimodal Generative Artificial Intelligence","display_name":"Recursiveness in Multimodal Generative Artificial Intelligence","publication_year":2024,"publication_date":"2024-08-22","ids":{"openalex":"https://openalex.org/W6893003303","doi":"https://doi.org/10.5281/zenodo.13362647"},"language":"en","primary_location":{"id":"doi:10.5281/zenodo.13362647","is_oa":true,"landing_page_url":"https://doi.org/10.5281/zenodo.13362647","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"dataset"},"type":"dataset","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.5281/zenodo.13362647","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Javier, Conde","orcid":"https://orcid.org/0000-0002-5304-0626"},"institutions":[{"id":"https://openalex.org/I88060688","display_name":"Universidad Polit\u00e9cnica de Madrid","ror":"https://ror.org/03n6nwv02","country_code":"ES","type":"education","lineage":["https://openalex.org/I88060688"]}],"countries":["ES"],"is_corresponding":true,"raw_author_name":"Javier, Conde","raw_affiliation_strings":["Universidad Polit\u00e9cnica de Madrid"],"affiliations":[{"raw_affiliation_string":"Universidad Polit\u00e9cnica de Madrid","institution_ids":["https://openalex.org/I88060688"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Tobias, Cheung","orcid":null},"institutions":[{"id":"https://openalex.org/I98677209","display_name":"University of Edinburgh","ror":"https://ror.org/01nrxwf90","country_code":"GB","type":"education","lineage":["https://openalex.org/I98677209"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Tobias, Cheung","raw_affiliation_strings":["University of Edinburgh"],"affiliations":[{"raw_affiliation_string":"University of Edinburgh","institution_ids":["https://openalex.org/I98677209"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Gonzalo, Mart\u00ednez","orcid":"https://orcid.org/0000-0002-9125-6225"},"institutions":[{"id":"https://openalex.org/I50357001","display_name":"Universidad Carlos III de Madrid","ror":"https://ror.org/03ths8210","country_code":"ES","type":"education","lineage":["https://openalex.org/I50357001"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Gonzalo, Mart\u00ednez","raw_affiliation_strings":["Universidad Carlos III de Madrid"],"affiliations":[{"raw_affiliation_string":"Universidad Carlos III de Madrid","institution_ids":["https://openalex.org/I50357001"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Pedro, Reviriego","orcid":"https://orcid.org/0000-0003-2540-5234"},"institutions":[{"id":"https://openalex.org/I88060688","display_name":"Universidad Polit\u00e9cnica de Madrid","ror":"https://ror.org/03n6nwv02","country_code":"ES","type":"education","lineage":["https://openalex.org/I88060688"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Pedro, Reviriego","raw_affiliation_strings":["Universidad Polit\u00e9cnica de Madrid"],"affiliations":[{"raw_affiliation_string":"Universidad Polit\u00e9cnica de Madrid","institution_ids":["https://openalex.org/I88060688"]}]},{"author_position":"last","author":{"id":null,"display_name":"Rik, Sarkar","orcid":"https://orcid.org/0000-0001-7804-4351"},"institutions":[{"id":"https://openalex.org/I98677209","display_name":"University of Edinburgh","ror":"https://ror.org/01nrxwf90","country_code":"GB","type":"education","lineage":["https://openalex.org/I98677209"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Rik, Sarkar","raw_affiliation_strings":["University of Edinburgh"],"affiliations":[{"raw_affiliation_string":"University of Edinburgh","institution_ids":["https://openalex.org/I98677209"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I88060688"],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":null,"topics":[],"keywords":[{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.534600019454956},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.4893999993801117},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.4706000089645386},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.43849998712539673},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.391400009393692},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.37940001487731934},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.36079999804496765}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7353000044822693},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6958000063896179},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.534600019454956},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.4893999993801117},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4706000089645386},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.43849998712539673},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.391400009393692},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.37940001487731934},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.36079999804496765},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3580999970436096},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.31209999322891235},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.3109000027179718},{"id":"https://openalex.org/C21780288","wikidata":"https://www.wikidata.org/wiki/Q5139731","display_name":"Coco","level":2,"score":0.3001999855041504},{"id":"https://openalex.org/C75294576","wikidata":"https://www.wikidata.org/wiki/Q5165192","display_name":"Contextual image classification","level":3,"score":0.2922999858856201},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.26269999146461487},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.25540000200271606},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.25}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.5281/zenodo.13362647","is_oa":true,"landing_page_url":"https://doi.org/10.5281/zenodo.13362647","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"dataset"}],"best_oa_location":{"id":"doi:10.5281/zenodo.13362647","is_oa":true,"landing_page_url":"https://doi.org/10.5281/zenodo.13362647","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"dataset"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0,33,58],"dataset":[1,8,59],"contains":[2,60,73],"images":[3,55,71,104,120,170,174,201,239,253],"extracted":[4,22],"from":[5,23,70,118,164,238],"the":[6,14,41,44,51,54,64,76,100,103,108,142,181,200,236,242],"COCO":[7,119],"that":[9,72,145],"have":[10],"been":[11],"tested":[12],"in":[13,37],"Recursive":[15],"Modality":[16],"Changes":[17],"process:":[18],"a":[19,30,38,165],"caption":[20],"is":[21,35],"an":[24],"image":[25,167],"and":[26,49,84,99,105,147,203,269],"used":[27,47],"to":[28],"generate":[29],"new":[31],"image.":[32],"process":[34],"repeated":[36],"loop.":[39],"For":[40],"extraction":[42],"of":[43,53,62,66,75,121,126,144,180,185,191,198,210,213,220,223,230,251,259],"description":[45],"was":[46],"GPT-4o":[48],"for":[50],"generation":[52],"DALL-E3.":[56],"Description":[57],"experiments":[61,130,143,159,212,222,265],"applying":[63],"RMC":[65,91],"length":[67],"40":[68],"generations":[69],"elements":[74],"following":[77],"categories:":[78],"apples,":[79],"elephants,":[80],"fire-hydrants,":[81],"persons,":[82],"toilets,":[83],"trains.":[85],"In":[86],"total,":[87],"there":[88],"are":[89],"10":[90],"loops":[92,125],"per":[93,261],"category":[94,123,128],"(40*10*6":[95],"=":[96],"2,400":[97],"images)":[98],"comparison":[101],"between":[102],"descriptions":[106,205],"using":[107],"metrics":[109,153,190],"LPIPS":[110],"VGG,":[111],"TF-IDF,":[112,155],"BERT":[113,157],"tokenizer,":[114],"BLIP.":[115],"1_coco_dataset:":[116],"information":[117],"each":[122,127,162,192],"2_categories:":[124],"results_{category}":[129],"results_dall-e-3_hd_{style}_{category}":[131],"->":[132,140,150,161,169,172,176,189,196,207,217,234,249,257,264],"hd":[133],"(high":[134],"definition),":[135],"style":[136,244],"(vivid":[137,245],"or":[138,246],"natural)":[139,247],"all":[141,199,231,235,252],"{style}":[146],"{category}":[148,215,225,262],"results_all.xlsx":[149],"similarity":[151],"with":[152,178,241],"LPIPS,":[154],"BLIP,":[156],"aggregated":[158,208,218],"{date}_{style}_{coco_id}":[160],"experiment":[163,182],"coco":[166],"imgs":[168],"imgs_resized":[171],"resized":[173],"experiment.json":[175],"json":[177],"data":[179],"(description,":[183],"number":[184],"generations,":[186],"etc.)":[187],"results.xlsx":[188],"individual":[193],"loop":[194],"images_all.xlsx":[195,248],"summary":[197,250,258],"generated":[202,240],"their":[204],"inter-experiments_results.xlsx":[206],"results":[209,219,229,237,260],"inter-trajectory":[211],"this":[214,224],"intra-experiments_results.xlsx":[216],"intra-trajectory":[221],"3_combined":[226],"results:":[227],"combined":[228],"categories":[232],"rsults_hd_labels_{style}":[233],"same":[243],"inter-exeriments_results_all.xlsx":[254],"intra-experiments_results_all.xlsx":[255],"results_all_labels.xlsx":[256],"4_different_styles":[263],"comparing":[266],"styles":[267],"(natural":[268],"vivid)":[270],"Paper":[271],"Paper:":[272],"Cite:":[273],"@misc{}":[274]},"counts_by_year":[],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-10T00:00:00"}
