{"id":"https://openalex.org/W4393611319","doi":"https://doi.org/10.5281/zenodo.10295081","title":"GItome: a curated dataset for README summarization","display_name":"GItome: a curated dataset for README summarization","publication_year":2023,"publication_date":"2023-12-07","ids":{"openalex":"https://openalex.org/W4393611319","doi":"https://doi.org/10.5281/zenodo.10295081"},"language":"en","primary_location":{"id":"doi:10.5281/zenodo.10295081","is_oa":true,"landing_page_url":"https://doi.org/10.5281/zenodo.10295081","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"dataset"},"type":"dataset","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.5281/zenodo.10295081","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5044470818","display_name":"Juri Di Rocco","orcid":"https://orcid.org/0000-0002-7909-3902"},"institutions":[{"id":"https://openalex.org/I26415053","display_name":"University of L'Aquila","ror":"https://ror.org/01j9p1r26","country_code":"IT","type":"education","lineage":["https://openalex.org/I26415053"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Di Rocco, Juri","raw_affiliation_strings":["Universit\u00e0 degli Studi dell'Aquila"],"raw_orcid":"https://orcid.org/0000-0002-7909-3902","affiliations":[{"raw_affiliation_string":"Universit\u00e0 degli Studi dell'Aquila","institution_ids":["https://openalex.org/I26415053"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002764716","display_name":"Davide Di Ruscio","orcid":"https://orcid.org/0000-0002-5077-6793"},"institutions":[{"id":"https://openalex.org/I26415053","display_name":"University of L'Aquila","ror":"https://ror.org/01j9p1r26","country_code":"IT","type":"education","lineage":["https://openalex.org/I26415053"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Di Ruscio, Davide","raw_affiliation_strings":["Universit\u00e0 degli Studi dell'Aquila"],"raw_orcid":"https://orcid.org/0000-0002-5077-6793","affiliations":[{"raw_affiliation_string":"Universit\u00e0 degli Studi dell'Aquila","institution_ids":["https://openalex.org/I26415053"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047553297","display_name":"Claudio Di Sipio","orcid":"https://orcid.org/0000-0001-9872-9542"},"institutions":[{"id":"https://openalex.org/I26415053","display_name":"University of L'Aquila","ror":"https://ror.org/01j9p1r26","country_code":"IT","type":"education","lineage":["https://openalex.org/I26415053"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Di Sipio, Claudio","raw_affiliation_strings":["University of L'Aquila"],"raw_orcid":"https://orcid.org/0000-0001-9872-9542","affiliations":[{"raw_affiliation_string":"University of L'Aquila","institution_ids":["https://openalex.org/I26415053"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5094324379","display_name":"Nguyen Phuong Than","orcid":null},"institutions":[{"id":"https://openalex.org/I26415053","display_name":"University of L'Aquila","ror":"https://ror.org/01j9p1r26","country_code":"IT","type":"education","lineage":["https://openalex.org/I26415053"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Phuong Than, Nguyen","raw_affiliation_strings":["University of L'Aquila"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of L'Aquila","institution_ids":["https://openalex.org/I26415053"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5061119465","display_name":"Riccardo Rubei","orcid":"https://orcid.org/0000-0001-9622-5949"},"institutions":[{"id":"https://openalex.org/I26415053","display_name":"University of L'Aquila","ror":"https://ror.org/01j9p1r26","country_code":"IT","type":"education","lineage":["https://openalex.org/I26415053"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Riccardo, Rubei","raw_affiliation_strings":["University of L'Aquila"],"raw_orcid":"https://orcid.org/0000-0001-9622-5949","affiliations":[{"raw_affiliation_string":"University of L'Aquila","institution_ids":["https://openalex.org/I26415053"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9944000244140625,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9944000244140625,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9829999804496765,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.953499972820282,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/automatic-summarization","display_name":"Automatic summarization","score":0.9214872121810913},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5144679546356201},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.36666592955589294}],"concepts":[{"id":"https://openalex.org/C170858558","wikidata":"https://www.wikidata.org/wiki/Q1394144","display_name":"Automatic summarization","level":2,"score":0.9214872121810913},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5144679546356201},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.36666592955589294}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.5281/zenodo.10295081","is_oa":true,"landing_page_url":"https://doi.org/10.5281/zenodo.10295081","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"dataset"}],"best_oa_location":{"id":"doi:10.5281/zenodo.10295081","is_oa":true,"landing_page_url":"https://doi.org/10.5281/zenodo.10295081","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"dataset"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2366403280","https://openalex.org/W1495108544","https://openalex.org/W2091301346","https://openalex.org/W3148229873","https://openalex.org/W2150160875","https://openalex.org/W4242223894","https://openalex.org/W1517524280","https://openalex.org/W4323520239","https://openalex.org/W2351187795"],"abstract_inverted_index":{"About":[0],"This":[1],"repository":[2],"contains":[3,68,80,93,103],"the":[4,11,16,19,69,75,81,84,87,94,104],"source":[5],"code":[6],"implementation":[7],"used":[8,97],"to":[9,18,98],"replicate":[10],"experimental":[12],"results":[13],"obtained":[14,72],"in":[15],"submitted":[17],"21st":[20],"International":[21],"Conference":[22],"on":[23],"Mining":[24],"Software":[25],"Repositories":[26],"(MSR204).":[27],"\"GItome:":[28],"a":[29],"curated":[30],"dataset":[31,61,71],"for":[32,108],"README":[33,76],"summarization\"":[34],"authored":[35],"by:":[36],"Juri":[37],"Di":[38,41,44],"Rocco,":[39],"Davide":[40],"Ruscio,":[42],"Claudio":[43],"Sipio,":[45],"Phuong":[46],"Than":[47],"Nguyen":[48],"and":[49],"Riccardo":[50],"Rubei":[51],"(1)":[52],"Universit\u00e0":[53],"degli":[54],"Studi":[55],"dell'Aquila,":[56],"Italy":[57],"Data":[58],"description":[59],"The":[60],"is":[62],"structured":[63],"as":[64],"follows:":[65],"output_dataset.zip:":[66],"It":[67,79,92,102],"benchmarking":[70],"by":[73],"parsing":[74],"files":[77],"gitome_repo.txt:":[78],"list":[82,105],"of":[83,86,106],"URLs":[85],"considered":[88,110],"GitHub":[89],"repositories":[90,107],"existing_dumps.zip:":[91],"existing":[95],"datasets":[96,111],"build":[99],"Gitome":[100],"repository_lists.txt:":[101],"each":[109],"(with":[112],"possible":[113],"duplicates)":[114]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
