{"id":"https://openalex.org/W4284697472","doi":"https://doi.org/10.1145/3477495.3531712","title":"CODEC: Complex Document and Entity Collection","display_name":"CODEC: Complex Document and Entity Collection","publication_year":2022,"publication_date":"2022-07-06","ids":{"openalex":"https://openalex.org/W4284697472","doi":"https://doi.org/10.1145/3477495.3531712"},"language":"en","primary_location":{"id":"doi:10.1145/3477495.3531712","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3477495.3531712","pdf_url":null,"source":{"id":"https://openalex.org/S4363608773","display_name":"Proceedings of the 45th International ACM SIGIR Conference on Research and Development in Information Retrieval","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 45th International ACM SIGIR Conference on Research and Development in Information Retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://eprints.gla.ac.uk/269440/1/269440.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5085187522","display_name":"Iain Mackie","orcid":"https://orcid.org/0000-0002-9690-9854"},"institutions":[{"id":"https://openalex.org/I7882870","display_name":"University of Glasgow","ror":"https://ror.org/00vtgdb53","country_code":"GB","type":"education","lineage":["https://openalex.org/I7882870"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Iain Mackie","raw_affiliation_strings":["University of Glasgow, Glasgow, United Kingdom"],"affiliations":[{"raw_affiliation_string":"University of Glasgow, Glasgow, United Kingdom","institution_ids":["https://openalex.org/I7882870"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044013117","display_name":"Paul Owoicho","orcid":"https://orcid.org/0000-0001-5811-8050"},"institutions":[{"id":"https://openalex.org/I7882870","display_name":"University of Glasgow","ror":"https://ror.org/00vtgdb53","country_code":"GB","type":"education","lineage":["https://openalex.org/I7882870"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Paul Owoicho","raw_affiliation_strings":["University of Glasgow, Glasgow, United Kingdom"],"affiliations":[{"raw_affiliation_string":"University of Glasgow, Glasgow, United Kingdom","institution_ids":["https://openalex.org/I7882870"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013122602","display_name":"Carlos Gemmell","orcid":"https://orcid.org/0000-0002-6730-8048"},"institutions":[{"id":"https://openalex.org/I7882870","display_name":"University of Glasgow","ror":"https://ror.org/00vtgdb53","country_code":"GB","type":"education","lineage":["https://openalex.org/I7882870"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Carlos Gemmell","raw_affiliation_strings":["University of Glasgow, Glasgow, United Kingdom"],"affiliations":[{"raw_affiliation_string":"University of Glasgow, Glasgow, United Kingdom","institution_ids":["https://openalex.org/I7882870"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082220616","display_name":"Sophie Fischer","orcid":"https://orcid.org/0000-0002-3324-3426"},"institutions":[{"id":"https://openalex.org/I7882870","display_name":"University of Glasgow","ror":"https://ror.org/00vtgdb53","country_code":"GB","type":"education","lineage":["https://openalex.org/I7882870"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Sophie Fischer","raw_affiliation_strings":["University of Glasgow, Glasgow, United Kingdom"],"affiliations":[{"raw_affiliation_string":"University of Glasgow, Glasgow, United Kingdom","institution_ids":["https://openalex.org/I7882870"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014199889","display_name":"Sean MacAvaney","orcid":"https://orcid.org/0000-0002-8914-2659"},"institutions":[{"id":"https://openalex.org/I7882870","display_name":"University of Glasgow","ror":"https://ror.org/00vtgdb53","country_code":"GB","type":"education","lineage":["https://openalex.org/I7882870"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Sean MacAvaney","raw_affiliation_strings":["University of Glasgow, Glasgow, United Kingdom"],"affiliations":[{"raw_affiliation_string":"University of Glasgow, Glasgow, United Kingdom","institution_ids":["https://openalex.org/I7882870"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5071842569","display_name":"Jeff Dalton","orcid":"https://orcid.org/0000-0003-2422-8651"},"institutions":[{"id":"https://openalex.org/I7882870","display_name":"University of Glasgow","ror":"https://ror.org/00vtgdb53","country_code":"GB","type":"education","lineage":["https://openalex.org/I7882870"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Jeffrey Dalton","raw_affiliation_strings":["University of Glasgow, Glasgow, United Kingdom"],"affiliations":[{"raw_affiliation_string":"University of Glasgow, Glasgow, United Kingdom","institution_ids":["https://openalex.org/I7882870"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5085187522"],"corresponding_institution_ids":["https://openalex.org/I7882870"],"apc_list":null,"apc_paid":null,"fwci":0.6259,"has_fulltext":true,"cited_by_count":6,"citation_normalized_percentile":{"value":0.66809751,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"3067","last_page":"3077"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9944000244140625,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9933000206947327,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8571306467056274},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.6714621186256409},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6347622275352478},{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.6308703422546387},{"id":"https://openalex.org/keywords/codec","display_name":"Codec","score":0.601319432258606},{"id":"https://openalex.org/keywords/resource","display_name":"Resource (disambiguation)","score":0.5289623141288757},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.5031747221946716},{"id":"https://openalex.org/keywords/rewriting","display_name":"Rewriting","score":0.441513329744339},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.37240737676620483},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.0858745276927948}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8571306467056274},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.6714621186256409},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6347622275352478},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.6308703422546387},{"id":"https://openalex.org/C161765866","wikidata":"https://www.wikidata.org/wiki/Q184748","display_name":"Codec","level":2,"score":0.601319432258606},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.5289623141288757},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.5031747221946716},{"id":"https://openalex.org/C154690210","wikidata":"https://www.wikidata.org/wiki/Q1668499","display_name":"Rewriting","level":2,"score":0.441513329744339},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.37240737676620483},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0858745276927948},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3477495.3531712","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3477495.3531712","pdf_url":null,"source":{"id":"https://openalex.org/S4363608773","display_name":"Proceedings of the 45th International ACM SIGIR Conference on Research and Development in Information Retrieval","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 45th International ACM SIGIR Conference on Research and Development in Information Retrieval","raw_type":"proceedings-article"},{"id":"pmh:oai:eprints.gla.ac.uk:269440","is_oa":true,"landing_page_url":"https://eprints.gla.ac.uk/view/author/54266.html>,","pdf_url":"https://eprints.gla.ac.uk/269440/1/269440.pdf","source":{"id":"https://openalex.org/S4210235606","display_name":"ENLIGHTEN (Jurnal Bimbingan dan Konseling Islam)","issn_l":"2622-8912","issn":["2622-8912","2622-8920"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"PeerReviewed"}],"best_oa_location":{"id":"pmh:oai:eprints.gla.ac.uk:269440","is_oa":true,"landing_page_url":"https://eprints.gla.ac.uk/view/author/54266.html>,","pdf_url":"https://eprints.gla.ac.uk/269440/1/269440.pdf","source":{"id":"https://openalex.org/S4210235606","display_name":"ENLIGHTEN (Jurnal Bimbingan dan Konseling Islam)","issn_l":"2622-8912","issn":["2622-8912","2622-8920"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"PeerReviewed"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1703974055","display_name":null,"funder_award_id":"2019 Research Grant","funder_id":"https://openalex.org/F4320309327","funder_display_name":"Google"},{"id":"https://openalex.org/G1721869620","display_name":null,"funder_award_id":"2019 Data Science Research Grant","funder_id":"https://openalex.org/F4320307921","funder_display_name":"Bloomberg L.P."},{"id":"https://openalex.org/G1934935867","display_name":null,"funder_award_id":"Engineering and Physical Sciences R","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G3203412108","display_name":"Turing AI Fellowship:Neural Conversational Information Seeking Assistant","funder_award_id":"EP/V025708/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G7302224536","display_name":null,"funder_award_id":"EP/V025708/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"}],"funders":[{"id":"https://openalex.org/F4320307921","display_name":"Bloomberg L.P.","ror":"https://ror.org/02rdpzb15"},{"id":"https://openalex.org/F4320309327","display_name":"Google","ror":"https://ror.org/00njsd438"},{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4284697472.pdf","grobid_xml":"https://content.openalex.org/works/W4284697472.grobid-xml"},"referenced_works_count":31,"referenced_works":["https://openalex.org/W1990190154","https://openalex.org/W2000246295","https://openalex.org/W2000411838","https://openalex.org/W2011329312","https://openalex.org/W2059166475","https://openalex.org/W2098700435","https://openalex.org/W2117473841","https://openalex.org/W2710956079","https://openalex.org/W2740492458","https://openalex.org/W2807291761","https://openalex.org/W2883671141","https://openalex.org/W2940927814","https://openalex.org/W2955701345","https://openalex.org/W2975063679","https://openalex.org/W3021397474","https://openalex.org/W3093655911","https://openalex.org/W3094231056","https://openalex.org/W3100107515","https://openalex.org/W3102286003","https://openalex.org/W3102937497","https://openalex.org/W3133594109","https://openalex.org/W3152736451","https://openalex.org/W3152887675","https://openalex.org/W3156166379","https://openalex.org/W3169283738","https://openalex.org/W3180230246","https://openalex.org/W3201233724","https://openalex.org/W3217485291","https://openalex.org/W4221150501","https://openalex.org/W4251326898","https://openalex.org/W4365799947"],"related_works":["https://openalex.org/W2120204135","https://openalex.org/W2139396251","https://openalex.org/W1796293478","https://openalex.org/W1577544887","https://openalex.org/W2168276503","https://openalex.org/W1573537275","https://openalex.org/W2105713543","https://openalex.org/W174435416","https://openalex.org/W2132239740","https://openalex.org/W3204937561"],"abstract_inverted_index":{"CODEC":[0,34],"is":[1],"a":[2,42],"document":[3],"and":[4,41,61,69,86],"entity":[5,51],"ranking":[6],"benchmark":[7],"that":[8],"focuses":[9],"on":[10,58],"complex":[11],"research":[12],"topics.":[13],"We":[14],"target":[15],"essay-style":[16],"information":[17],"needs":[18],"of":[19],"social":[20],"science":[21],"researchers,":[22],"i.e.":[23],"\"How":[24],"has":[25],"the":[26],"UK's":[27],"Open":[28],"Banking":[29],"Regulation":[30],"benefited":[31],"Challenger":[32],"Banks\".":[33],"includes":[35,55],"42":[36],"topics":[37],"developed":[38],"by":[39],"researchers":[40],"new":[43],"focused":[44],"web":[45],"corpus":[46],"with":[47],"semantic":[48],"annotations":[49],"including":[50],"links.":[52],"This":[53],"resource":[54],"expert":[56],"judgments":[57],"17,509":[59],"documents":[60],"entities":[62],"(416.9":[63],"per":[64],"topic)":[65],"from":[66],"diverse":[67],"automatic":[68,87],"interactive":[70],"manual":[71,74],"runs.":[72],"The":[73],"runs":[75],"include":[76],"387":[77],"query":[78,83],"reformulations,":[79],"providing":[80],"data":[81],"for":[82],"performance":[84],"prediction":[85],"rewriting":[88],"evaluation.":[89]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1}],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-10-10T00:00:00"}
