{"id":"https://openalex.org/W7117683005","doi":"https://doi.org/10.5281/zenodo.18098507","title":"Replication package for the paper: \"Datasets, Bias, Licenses, and Terms of Use: A Large and Longitudinal Study on the Documentation of Hugging Face Machine Learning Models\"","display_name":"Replication package for the paper: \"Datasets, Bias, Licenses, and Terms of Use: A Large and Longitudinal Study on the Documentation of Hugging Face Machine Learning Models\"","publication_year":2025,"publication_date":"2025-12-30","ids":{"openalex":"https://openalex.org/W7117683005","doi":"https://doi.org/10.5281/zenodo.18098507"},"language":null,"primary_location":{"id":"doi:10.5281/zenodo.18098507","is_oa":true,"landing_page_url":"https://doi.org/10.5281/zenodo.18098507","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"dataset"},"type":"dataset","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.5281/zenodo.18098507","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5121668053","display_name":"Federica Pepe","orcid":null},"institutions":[{"id":"https://openalex.org/I16337185","display_name":"University of Sannio","ror":"https://ror.org/04vc81p87","country_code":"IT","type":"education","lineage":["https://openalex.org/I16337185"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Pepe, Federica","raw_affiliation_strings":["University of Sannio"],"raw_orcid":"https://orcid.org/0009-0008-3038-3977","affiliations":[{"raw_affiliation_string":"University of Sannio","institution_ids":["https://openalex.org/I16337185"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042772226","display_name":"Vittoria Nardone","orcid":"https://orcid.org/0000-0001-7888-6620"},"institutions":[{"id":"https://openalex.org/I129627893","display_name":"University of Molise","ror":"https://ror.org/04z08z627","country_code":"IT","type":"education","lineage":["https://openalex.org/I129627893"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Nardone, Vittoria","raw_affiliation_strings":["University of Molise"],"raw_orcid":"https://orcid.org/0000-0001-7888-6620","affiliations":[{"raw_affiliation_string":"University of Molise","institution_ids":["https://openalex.org/I129627893"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069505458","display_name":"Antonio Mastropaolo","orcid":"https://orcid.org/0000-0002-7965-7712"},"institutions":[{"id":"https://openalex.org/I16285277","display_name":"William & Mary","ror":"https://ror.org/03hsf0573","country_code":"US","type":"education","lineage":["https://openalex.org/I16285277"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mastropaolo, Antonio","raw_affiliation_strings":["William & Mary"],"raw_orcid":"https://orcid.org/0000-0002-7965-7712","affiliations":[{"raw_affiliation_string":"William & Mary","institution_ids":["https://openalex.org/I16285277"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006915371","display_name":"Gerardo Canfora","orcid":"https://orcid.org/0000-0003-0049-1279"},"institutions":[{"id":"https://openalex.org/I16337185","display_name":"University of Sannio","ror":"https://ror.org/04vc81p87","country_code":"IT","type":"education","lineage":["https://openalex.org/I16337185"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Canfora, Gerardo","raw_affiliation_strings":["University of Sannio"],"raw_orcid":"https://orcid.org/0000-0003-0049-1279","affiliations":[{"raw_affiliation_string":"University of Sannio","institution_ids":["https://openalex.org/I16337185"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056526226","display_name":"Gabriele Bavota","orcid":"https://orcid.org/0000-0002-2216-3148"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"BAVOTA, Gabriele","raw_affiliation_strings":[],"raw_orcid":"https://orcid.org/0000-0002-2216-3148","affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5025099559","display_name":"Massimiliano Di Penta","orcid":"https://orcid.org/0000-0002-0340-9747"},"institutions":[{"id":"https://openalex.org/I16337185","display_name":"University of Sannio","ror":"https://ror.org/04vc81p87","country_code":"IT","type":"education","lineage":["https://openalex.org/I16337185"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Di Penta, Massimiliano","raw_affiliation_strings":["University of Sannio"],"raw_orcid":"https://orcid.org/0000-0002-0340-9747","affiliations":[{"raw_affiliation_string":"University of Sannio","institution_ids":["https://openalex.org/I16337185"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":null,"topics":[],"keywords":[{"id":"https://openalex.org/keywords/directory","display_name":"Directory","score":0.7784000039100647},{"id":"https://openalex.org/keywords/scripting-language","display_name":"Scripting language","score":0.7425000071525574},{"id":"https://openalex.org/keywords/documentation","display_name":"Documentation","score":0.6941999793052673},{"id":"https://openalex.org/keywords/snapshot","display_name":"Snapshot (computer storage)","score":0.49540001153945923},{"id":"https://openalex.org/keywords/schema","display_name":"Schema (genetic algorithms)","score":0.4377000033855438},{"id":"https://openalex.org/keywords/python","display_name":"Python (programming language)","score":0.37310001254081726},{"id":"https://openalex.org/keywords/replication","display_name":"Replication (statistics)","score":0.34049999713897705},{"id":"https://openalex.org/keywords/file-format","display_name":"File format","score":0.3278999924659729}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8212000131607056},{"id":"https://openalex.org/C2777683733","wikidata":"https://www.wikidata.org/wiki/Q201456","display_name":"Directory","level":2,"score":0.7784000039100647},{"id":"https://openalex.org/C61423126","wikidata":"https://www.wikidata.org/wiki/Q187432","display_name":"Scripting language","level":2,"score":0.7425000071525574},{"id":"https://openalex.org/C56666940","wikidata":"https://www.wikidata.org/wiki/Q788790","display_name":"Documentation","level":2,"score":0.6941999793052673},{"id":"https://openalex.org/C55282118","wikidata":"https://www.wikidata.org/wiki/Q252683","display_name":"Snapshot (computer storage)","level":2,"score":0.49540001153945923},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.45190000534057617},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.44110000133514404},{"id":"https://openalex.org/C52146309","wikidata":"https://www.wikidata.org/wiki/Q7431116","display_name":"Schema (genetic algorithms)","level":2,"score":0.4377000033855438},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.4221000075340271},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.41440001130104065},{"id":"https://openalex.org/C519991488","wikidata":"https://www.wikidata.org/wiki/Q28865","display_name":"Python (programming language)","level":2,"score":0.37310001254081726},{"id":"https://openalex.org/C12590798","wikidata":"https://www.wikidata.org/wiki/Q3933199","display_name":"Replication (statistics)","level":2,"score":0.34049999713897705},{"id":"https://openalex.org/C97250363","wikidata":"https://www.wikidata.org/wiki/Q235557","display_name":"File format","level":2,"score":0.3278999924659729},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.32710000872612},{"id":"https://openalex.org/C181177684","wikidata":"https://www.wikidata.org/wiki/Q188816","display_name":"Lightweight Directory Access Protocol","level":3,"score":0.3068000078201294},{"id":"https://openalex.org/C183003079","wikidata":"https://www.wikidata.org/wiki/Q1000371","display_name":"Personalization","level":2,"score":0.30300000309944153},{"id":"https://openalex.org/C171730128","wikidata":"https://www.wikidata.org/wiki/Q5227290","display_name":"Data file","level":2,"score":0.28780001401901245},{"id":"https://openalex.org/C118643609","wikidata":"https://www.wikidata.org/wiki/Q189210","display_name":"Web application","level":2,"score":0.2840999960899353},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.2768000066280365},{"id":"https://openalex.org/C88006597","wikidata":"https://www.wikidata.org/wiki/Q690117","display_name":"Disk formatting","level":2,"score":0.265500009059906},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.2639000117778778},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2619999945163727},{"id":"https://openalex.org/C21959979","wikidata":"https://www.wikidata.org/wiki/Q36774","display_name":"Web page","level":2,"score":0.26179999113082886},{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.25929999351501465},{"id":"https://openalex.org/C138708601","wikidata":"https://www.wikidata.org/wiki/Q8811","display_name":"HTML","level":3,"score":0.25600001215934753},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.250900000333786}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.5281/zenodo.18098507","is_oa":true,"landing_page_url":"https://doi.org/10.5281/zenodo.18098507","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"dataset"}],"best_oa_location":{"id":"doi:10.5281/zenodo.18098507","is_oa":true,"landing_page_url":"https://doi.org/10.5281/zenodo.18098507","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"dataset"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"This":[0],"replication":[1,592],"package":[2,593],"contains":[3,167,176,186,199,209,218,506,822,931,939,949,962,972,981],"datasets":[4,231,252,264,548,560,994,1015,1027],"and":[5,14,20,44,46,60,78,193,327,332,347,352,367,374,389,396,410,417,438,445,538,650,738,774,792,807,818,824,833,956,1090,1095],"scripts":[6,56,77,823],"related":[7,97,329,349,371,393,414,442,465,480,715,863,875,1092],"to":[8,38,58,98,204,330,350,372,394,415,443,466,481,564,575,598,695,710,716,764,826,838,864,876,967,1093],"the":[9,24,40,47,55,67,71,88,92,99,110,125,135,144,152,162,187,191,200,205,210,219,237,246,260,269,280,294,309,321,341,462,471,477,486,502,529,531,533,539,556,569,577,583,588,591,596,609,614,632,639,646,652,657,660,675,690,697,712,724,730,735,740,771,787,828,840,843,860,869,877,888,898,907,916,926,950,954,963,968,973,982,1000,1009,1023,1032,1043,1057,1072,1084],"paper:":[10],"\"Datasets,":[11],"Bias,":[12],"Licenses,":[13],"Terms":[15],"of":[16,26,120,131,140,148,158,215,221,229,234,243,256,263,268,283,297,312,317,337,379,400,422,450,461,468,476,483,492,498,513,535,541,546,552,559,571,590,616,627,656,665,669,677,679,682,689,700,747,750,754,784,797,845,852,859,866,883,894,903,912,922,978,984,992,997,1006,1019,1026,1031,1046,1060,1075,1080],"Use:":[17],"A":[18],"Large":[19],"Longitudinal":[21],"Study":[22],"on":[23],"Documentation":[25],"Hugging":[27],"Face":[28],"Machine":[29],"Learning":[30],"Models\"":[31],"root":[32,589],"directory":[33,581],"statistics.r:":[34],"R":[35],"script":[36,72,563,611,837],"used":[37,57,80,258,515,525,554,1021],"compute":[39,696,711],"correlation":[41],"between":[42,190,363,385,406,434,803,830,953],"usage":[43,168,177,360,382,403,431,507,800,932,940],"downloads,":[45],"RQ1/RQ2":[48],"inter-rater":[49,698,713],"agreements":[50],"scripts/":[51],"Directory":[52,75],"containing":[53,76,108],"all":[54,109,853],"collect":[59],"process":[61],"data.":[62],"For":[63,84],"further":[64,82,85],"details,":[65,86],"see":[66,87],"README":[68,89],"file":[69,90,107,604,694,709,727],"inside":[70,91],"directory.":[73,93],"further-analyses/":[74],"data":[79,96,825,874],"for":[81,172,181,196,259,355,424,452,470,485,522,555,568,622,659,720,760,777,868,936,944,959,1022],"analyses.":[83],"first-snaphot":[94],"Contains":[95,873],"first":[100,192,472,870,955],"snapshot":[101,195,473,488,871,958],"(ICPC":[102],"2024":[103],"study)":[104],"modelsInfo.zip:":[105],"zip":[106],"downloaded":[111],"model":[112,171,180,201,274,510,524,566,633,640,647,653,685,705,722,788,935,943,964,1037],"cards":[113,202,965],"(in":[114],"JSON":[115],"format)":[116],"Dataset":[117,489,880],"Dataset/DatasetHFmodellist.csv:":[118],"list":[119,130,139,147,157,228,233,242,316,336,491,497,545,626,844,882,893,902,911,921,991,996,1005,1079],"HF":[121,230,493,547,636,884,993],"models":[122,188,235,244,257,494,514,553,855,885,951,998,1007,1020],"analyzed,":[123,886],"with":[124,212,224,249,279,293,308,323,343,426,454,582,756,814,847,887,975,987,1012,1042,1056,1071,1086],"following":[126,889],"information:":[127,890],"id,downloads,likes,tags,pipelinetag,pipelinecategory,License,licensemodelpermissivity":[128],"Dataset/DatasetGitHubprjlistTransformers.txt:":[129],"GitHub":[132,141,149,159,499,518,527,895,904,913,923],"projects":[133,142,150,160,211,223,318,338,425,453,500,896,905,914,924,974,986,1081],"using":[134,143,151,161,501,897,906,915,925],"transformers":[136,154,173,286,503,899,918,1049],"library":[137,155,165,174,183,354,376,419,447,504,900,909,919,929,946,1097],"Dataset/DatasetGitHubprjlistDiffusers.txt:":[138],"diffuserslibrary":[145],"Dataset/DatasetGitHubprjfrompretrainedTransformers.txt:":[146],"\"frompretrained\"":[153,163],"Dataset/DatasetGitHubprjfrompretrainedDiffusers.txt:":[156],"diffusers":[164,182,301,908,928,945,1064],"Dataset/DatasetGitHubprjmodelusedTransformers.csv:":[166],"pairs:":[169,178,508,933,941],"project,":[170,179,509,934,942],"Dataset/DatasetGitHubprjmodelusedDiffusers.csv:":[175],"Dataset/DatasetIntersectedModels.csv":[184],":":[185,241,300,948,1004,1063],"shared":[189,952],"second":[194,487,878,957],"category":[197,742,960],"Dataset/modelsReadme:":[198,961],"belonging":[203,966],"sample":[206,254,550,658,749,969,1017],"size":[207,970],"Dataset/projectswith5ormorestars.csv:":[208],"numStars":[213,225,976,988],"major":[214,977],"5":[216,358,429,457,979],"Dataset/projectsstars_summary.csv:":[217],"number":[220,282,296,311,512,534,540,676,983,1045,1059,1074],"total":[222,315,335,985,1078],"RQ1":[226,543,989],"RQ1/RQ1datasetlistHF.txt:":[227],"RQ1/RQ1datasetTags.txt:":[232],"declaring":[236,245,999,1008],"dataset":[238,247,1001,1010],"tag":[239,248,773,1002,1011],"RQ1/RQ1modelDataset.csv":[240],"their":[250,324,344,815,848,1013,1087],"respective":[251,281,295,310,325,345,816,1014,1044,1058,1073,1088],"RQ1/RQ1datasetSample.csv:":[253],"set":[255,551,1018],"manual":[261,270,463,478,557,661,691,745,861,1024,1033],"analysis":[262,558,662,829,841,1025],"RQ2":[265,671,1028],"RQ2/RQ2biasclassification_sheet.csv:":[266],"results":[267,460,475,688,858,1030],"labeling":[271,464,479,692,862,1034],"RQ3":[272,743,1035],"RQ3/RQ3LicenseModels.csv:":[273],"license":[275,288,303,772,798,834,1038,1051,1066],"list,categorized":[276,1039],"by":[277,291,306,516,526,608,684,1040,1054,1069],"permissiveness,":[278,292,307,1041,1055,1070],"occurrences":[284,298,313,678,1047,1061,1076],"RQ3/RQ3LicenseprjTransformers.csv:":[285],"project":[287,302,519,762,1050,1065],"list,":[289,304,1052,1067],"categorized":[290,305,1053,1068],"RQ3/RQ3LicenseprjDiffusers.csv":[299],"RQ3/RQ3prjmodellicensepermissivityTransformersDiffusers.csv:":[314],"that":[319,339,1082],"reuse":[320,340,1083],"models,":[322,342,765,1085],"licenses":[326,346,365,369,387,391,401,408,412,436,440,451,751,755,805,809,817,846,851,1089],"permissiveness":[328,348,380,423,758,819,849,1091],"Transformers":[331,351,373,395,416,444,1094],"Diffuserslibrary":[333,397],"RQ3/RQ3prjmodellicensepermissivityTransformersDiffusersStarmajor5.csv:":[334],"Diffusers":[353,375,418,446,1096],"numStar":[356,427,455],">":[357,428,456],"RQ3/RQ3ContingencyMatrixpermissivityTransformersDiffusers.csv:":[359],"contingency":[361,383,404,432,801],"table":[362,384,405,433,673,802],"projects'":[364,386,407,435,804],"(columns)":[366,388,409,437,806],"models'":[368,390,411,439,808],"(rows)":[370,392,413,441,810],"in":[377,398,420,448,579,602,723],"terms":[378,399,421,449,467,482,865],"RQ3/RQ3ContingencyMatrixlicensesTransformersDiffusers.csv:":[381],"RQ3/RQ3ContingencyMatrixpermissivityTransformersDiffusersStarmajor5.csv:":[402],"RQ3/RQ3ContingencyMatrixlicensesTransformersDiffusers_Starmajor5.csv:":[430],"RQ4":[458,856],"RQ4/RQ4TermsofUseSnapshot1.csv:":[459],"use":[469,484,867],"RQ4/RQ4TermsofUseSnapshot2.csv:":[474],"Dataset/Dataset_HF-models-list.csv:":[490],"analyzed":[495,607,854],"Dataset/Dataset_github-prj-list.txt:":[496],"Dataset/Dataset_github-Prj_model-Used.csv:":[505],"Dataset/Dataset_prj-num-models-reused.csv:":[511],"each":[517,523,623,721,761,778],"Dataset/Dataset_model-download_num-prj_correlation.csv":[520],"contains,":[521],"projects:":[528],"name,":[530],"task,":[532],"reusing":[536],"projects,":[537],"downloads":[542],"RQ1/RQ1_dataset-list.txt:":[544],"RQ1/RQ1_datasetSample.csv:":[549,1016],"RQ1/RQ1_analyzeDatasetTags.py:":[561],"Python":[562],"analyze":[565],"tags":[567],"presence":[570],"datasets.":[572],"it":[573,769],"requires":[574],"unzip":[576],"modelsInfo.zip":[578],"a":[580,603,625,704,748,790],"same":[584],"name":[585,775],"(modelsInfo)":[586],"at":[587],"folder.":[594],"Produces":[595],"output":[597,615,664,668],"stdout.":[599],"To":[600],"redirect":[601],"fo":[605],"be":[606],"RQ2/countDataset.py":[610,670],"RQ1/RQ1_countDataset.py:":[612],"given":[613],"RQ2/analyzeDatasetTags.py":[617,666],"(passed":[618],"as":[619],"argument)":[620],"produces,":[621],"model,":[624,779],"Booleans":[628],"indicating":[629],"whether":[630,701,786],"(i)":[631,729],"only":[634,641],"declares":[635,642,648],"datasets,":[637,644],"(ii)":[638,734],"external":[643],"(iii)":[645,739],"both,":[649],"(iv)":[651],"is":[654],"part":[655],"RQ1/RQ1_datasetTags.csv:":[663],"RQ1/RQ1_dataset_usage_count.csv:":[667],"RQ2/tableBias.pdf:":[672],"detailing":[674],"different":[680,757],"types":[681,832],"bias":[683,717,731],"Task":[686],"RQ2/RQ2_bias_classification_sheet.csv:":[687,1029],"RQ2/RQ2_isBiased.csv:":[693],"agreement":[699,714],"or":[702],"not":[703],"documents":[706],"Bias":[707],"RQ2/RQ2_biasAgrLabels.csv:":[708],"categories":[718],"RQ2/RQ2_final_bias_categories_with_levels.csv:":[719],"sample,":[725],"this":[726],"lists":[728,753],"leaf":[732],"category,":[733,737],"first-level":[736],"intermediate":[741],"RQ3/RQ3_LicenseValidation.csv:":[744],"validation":[746],"RQ3/RQ3_{NETWORK-RESTRICTIVE|RESTRICTIVE|WEAK-RESTRICTIVE|PERMISSIVE}-license-list.txt:":[752],"RQ3/RQ3_prjs_license.csv:":[759],"linked":[763],"among":[766,781],"other":[767,782],"fields":[768],"indicates":[770,780],"RQ3/RQ3_models_license.csv:":[776],"pieces":[783],"info,":[785],"has":[789],"license,":[791],"if":[793],"yes":[794],"what":[795],"kind":[796],"RQ3/RQ3_model-prj-license_contingency_table.csv:":[799],"RQ3/RQ3_models_prjs_licenses_with_type.csv:":[811],"pairs":[812],"project-model,":[813],"level":[820],"RQ3/license-task-relation/:":[821],"perform":[827,839],"task":[831],"types:":[835],"analysis\\_by\\_type.py:":[836],"list.csv:":[842],"licensebytype.csv:":[850],"RQ4/RQ4_Terms_of_Use_Snapshot1.csv:":[857],"second-snaphot":[872],"snapshot.":[879],"Dataset/Dataset_HF_model_list.csv:":[881],"id,downloads,likes,tags,pipeline_tag,pipeline_category,License,license_model_permissivity":[891],"Dataset/Dataset_GitHub_prj_list_Transformers.txt:":[892],"Dataset/Dataset_GitHub_prj_list_Diffusers.txt:":[901],"Dataset/Dataset_GitHub_prj_frompretrained_Transformers.txt:":[910],"\"from_pretrained\"":[917,927],"Dataset/Dataset_GitHub_prj_frompretrained_Diffusers.txt:":[920],"Dataset/Dataset_GitHub_prj_model_used_Transformers.csv:":[930],"transformerslibrary":[937],"Dataset/Dataset_GitHub_prj_model_used_Diffusers.csv:":[938],"Dataset/Dataset_IntersectedModels.csv":[947],"Dataset/projects_with_5_or_more_stars.csv:":[971],"Dataset/projects_stars_summary.csv:":[980],"RQ1/RQ1_dataset_list_HF.txt:":[990],"RQ1/RQ1_datasetTags.txt:":[995],"RQ1/RQ1_modelDataset.csv":[1003],"RQ3/RQ3_License_Models.csv:":[1036],"RQ3/RQ3_License_prjTransformers.csv:":[1048],"RQ3/RQ3_License_prjDiffusers.csv":[1062],"RQ3/RQ3_prj_model_license_permissivity_Transformers_Diffusers.csv:":[1077],"RQ3/":[1098]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-12-31T00:00:00"}
