{"id":"https://openalex.org/W2275236596","doi":"https://doi.org/10.1145/2816815","title":"Power Law Distributions in Information Retrieval","display_name":"Power Law Distributions in Information Retrieval","publication_year":2016,"publication_date":"2016-02-16","ids":{"openalex":"https://openalex.org/W2275236596","doi":"https://doi.org/10.1145/2816815","mag":"2275236596"},"language":"en","primary_location":{"id":"doi:10.1145/2816815","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2816815","pdf_url":null,"source":{"id":"https://openalex.org/S4394735545","display_name":"ACM Transactions on Information Systems","issn_l":"1046-8188","issn":["1046-8188","1558-2868"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Information Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5016676280","display_name":"Casper Petersen","orcid":"https://orcid.org/0000-0001-5858-1985"},"institutions":[{"id":"https://openalex.org/I124055696","display_name":"University of Copenhagen","ror":"https://ror.org/035b05819","country_code":"DK","type":"education","lineage":["https://openalex.org/I124055696"]}],"countries":["DK"],"is_corresponding":true,"raw_author_name":"Casper Petersen","raw_affiliation_strings":["University of Copenhagen, Denmark"],"affiliations":[{"raw_affiliation_string":"University of Copenhagen, Denmark","institution_ids":["https://openalex.org/I124055696"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024664299","display_name":"Jakob Grue Simonsen","orcid":"https://orcid.org/0000-0002-3488-9392"},"institutions":[{"id":"https://openalex.org/I124055696","display_name":"University of Copenhagen","ror":"https://ror.org/035b05819","country_code":"DK","type":"education","lineage":["https://openalex.org/I124055696"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Jakob Grue Simonsen","raw_affiliation_strings":["University of Copenhagen, Denmark"],"affiliations":[{"raw_affiliation_string":"University of Copenhagen, Denmark","institution_ids":["https://openalex.org/I124055696"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5045425016","display_name":"Christina Lioma","orcid":"https://orcid.org/0000-0003-2600-2701"},"institutions":[{"id":"https://openalex.org/I124055696","display_name":"University of Copenhagen","ror":"https://ror.org/035b05819","country_code":"DK","type":"education","lineage":["https://openalex.org/I124055696"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Christina Lioma","raw_affiliation_strings":["University of Copenhagen, Denmark"],"affiliations":[{"raw_affiliation_string":"University of Copenhagen, Denmark","institution_ids":["https://openalex.org/I124055696"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5016676280"],"corresponding_institution_ids":["https://openalex.org/I124055696"],"apc_list":null,"apc_paid":null,"fwci":5.6345,"has_fulltext":false,"cited_by_count":52,"citation_normalized_percentile":{"value":0.96235294,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"34","issue":"2","first_page":"1","last_page":"37"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10064","display_name":"Complex Network Analysis Techniques","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10064","display_name":"Complex Network Analysis Techniques","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.9937000274658203,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9925000071525574,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/power-law","display_name":"Power law","score":0.5295575261116028},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.51873379945755},{"id":"https://openalex.org/keywords/probability-distribution","display_name":"Probability distribution","score":0.4892570972442627},{"id":"https://openalex.org/keywords/gaussian","display_name":"Gaussian","score":0.4544009864330292},{"id":"https://openalex.org/keywords/inverse","display_name":"Inverse","score":0.4387887120246887},{"id":"https://openalex.org/keywords/frequency-distribution","display_name":"Frequency distribution","score":0.42851877212524414},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.3566444516181946},{"id":"https://openalex.org/keywords/law","display_name":"Law","score":0.3563012182712555},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.2907106280326843},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.10276848077774048}],"concepts":[{"id":"https://openalex.org/C87040749","wikidata":"https://www.wikidata.org/wiki/Q428971","display_name":"Power law","level":2,"score":0.5295575261116028},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.51873379945755},{"id":"https://openalex.org/C149441793","wikidata":"https://www.wikidata.org/wiki/Q200726","display_name":"Probability distribution","level":2,"score":0.4892570972442627},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.4544009864330292},{"id":"https://openalex.org/C207467116","wikidata":"https://www.wikidata.org/wiki/Q4385666","display_name":"Inverse","level":2,"score":0.4387887120246887},{"id":"https://openalex.org/C51921466","wikidata":"https://www.wikidata.org/wiki/Q1627586","display_name":"Frequency distribution","level":2,"score":0.42851877212524414},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3566444516181946},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.3563012182712555},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.2907106280326843},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.10276848077774048},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/2816815","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2816815","pdf_url":null,"source":{"id":"https://openalex.org/S4394735545","display_name":"ACM Transactions on Information Systems","issn_l":"1046-8188","issn":["1046-8188","1558-2868"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Information Systems","raw_type":"journal-article"},{"id":"pmh:oai:pure.atira.dk:openaire_cris_publications/011da330-a914-4e07-81e6-6775e292e539","is_oa":false,"landing_page_url":"https://researchprofiles.ku.dk/da/publications/011da330-a914-4e07-81e6-6775e292e539","pdf_url":null,"source":{"id":"https://openalex.org/S4306401983","display_name":"Research at the University of Copenhagen (University of Copenhagen)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I124055696","host_organization_name":"University of Copenhagen","host_organization_lineage":["https://openalex.org/I124055696"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Petersen , C , Simonsen , J G & Lioma , C 2016 , ' Power law distributions in information retrieval ' , A C M Transactions on Information Systems , vol. 34 , no. 2 , 8 . https://doi.org/10.1145/2816815","raw_type":"article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.8199999928474426,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":169,"referenced_works":["https://openalex.org/W14235832","https://openalex.org/W36335185","https://openalex.org/W129305155","https://openalex.org/W198383996","https://openalex.org/W205142180","https://openalex.org/W258808915","https://openalex.org/W581215525","https://openalex.org/W587356381","https://openalex.org/W607600043","https://openalex.org/W1487943643","https://openalex.org/W1491360661","https://openalex.org/W1501235680","https://openalex.org/W1505031252","https://openalex.org/W1506069954","https://openalex.org/W1517590677","https://openalex.org/W1522242062","https://openalex.org/W1527463082","https://openalex.org/W1532325895","https://openalex.org/W1534381410","https://openalex.org/W1543711590","https://openalex.org/W1544520332","https://openalex.org/W1549014378","https://openalex.org/W1552247668","https://openalex.org/W1556485461","https://openalex.org/W1557301691","https://openalex.org/W1569709403","https://openalex.org/W1570233747","https://openalex.org/W1570260812","https://openalex.org/W1598342322","https://openalex.org/W1681759250","https://openalex.org/W1685426458","https://openalex.org/W1769703906","https://openalex.org/W1808298867","https://openalex.org/W1830719945","https://openalex.org/W1830805508","https://openalex.org/W1860144983","https://openalex.org/W1865446091","https://openalex.org/W1924133215","https://openalex.org/W1928047241","https://openalex.org/W1943015726","https://openalex.org/W1964154547","https://openalex.org/W1965086361","https://openalex.org/W1967674581","https://openalex.org/W1968371014","https://openalex.org/W1969721537","https://openalex.org/W1972070683","https://openalex.org/W1974339500","https://openalex.org/W1978577143","https://openalex.org/W1979313500","https://openalex.org/W1982219281","https://openalex.org/W1982314207","https://openalex.org/W1982858363","https://openalex.org/W1985672722","https://openalex.org/W1990843604","https://openalex.org/W1993803315","https://openalex.org/W1995173295","https://openalex.org/W1998559030","https://openalex.org/W1999326226","https://openalex.org/W2000042664","https://openalex.org/W2001149451","https://openalex.org/W2005311637","https://openalex.org/W2007590531","https://openalex.org/W2009435671","https://openalex.org/W2020284581","https://openalex.org/W2023214515","https://openalex.org/W2025047573","https://openalex.org/W2028904519","https://openalex.org/W2029296527","https://openalex.org/W2036671379","https://openalex.org/W2040890692","https://openalex.org/W2045638068","https://openalex.org/W2046972450","https://openalex.org/W2047008218","https://openalex.org/W2047634477","https://openalex.org/W2048076161","https://openalex.org/W2048649579","https://openalex.org/W2056144417","https://openalex.org/W2057464142","https://openalex.org/W2057571146","https://openalex.org/W2059304996","https://openalex.org/W2061069417","https://openalex.org/W2062021443","https://openalex.org/W2066180141","https://openalex.org/W2072156548","https://openalex.org/W2073766874","https://openalex.org/W2079356438","https://openalex.org/W2080066866","https://openalex.org/W2082061067","https://openalex.org/W2084862934","https://openalex.org/W2085761620","https://openalex.org/W2086378526","https://openalex.org/W2087309226","https://openalex.org/W2087692915","https://openalex.org/W2087863196","https://openalex.org/W2096290331","https://openalex.org/W2096361430","https://openalex.org/W2101196063","https://openalex.org/W2101460669","https://openalex.org/W2101846955","https://openalex.org/W2112053513","https://openalex.org/W2112948240","https://openalex.org/W2115054880","https://openalex.org/W2117325943","https://openalex.org/W2118009636","https://openalex.org/W2119485457","https://openalex.org/W2120892989","https://openalex.org/W2121821841","https://openalex.org/W2121871834","https://openalex.org/W2126863010","https://openalex.org/W2127246734","https://openalex.org/W2128442773","https://openalex.org/W2129235726","https://openalex.org/W2133953554","https://openalex.org/W2136719353","https://openalex.org/W2137924350","https://openalex.org/W2139882553","https://openalex.org/W2139940151","https://openalex.org/W2140849606","https://openalex.org/W2141499038","https://openalex.org/W2142635246","https://openalex.org/W2143070266","https://openalex.org/W2143288831","https://openalex.org/W2144211451","https://openalex.org/W2144219418","https://openalex.org/W2144885342","https://openalex.org/W2149282917","https://openalex.org/W2150937237","https://openalex.org/W2152421589","https://openalex.org/W2160160425","https://openalex.org/W2160555926","https://openalex.org/W2162541740","https://openalex.org/W2163021329","https://openalex.org/W2165071399","https://openalex.org/W2167414245","https://openalex.org/W2168175751","https://openalex.org/W2171743956","https://openalex.org/W2174008607","https://openalex.org/W2175110005","https://openalex.org/W2183266670","https://openalex.org/W2211904086","https://openalex.org/W2250837944","https://openalex.org/W2276223951","https://openalex.org/W2312217865","https://openalex.org/W2316904474","https://openalex.org/W2523688471","https://openalex.org/W2603834791","https://openalex.org/W2753666478","https://openalex.org/W2790417170","https://openalex.org/W2892038650","https://openalex.org/W2897129259","https://openalex.org/W2913252902","https://openalex.org/W2950627632","https://openalex.org/W2952193981","https://openalex.org/W3100249728","https://openalex.org/W3101452997","https://openalex.org/W3103362336","https://openalex.org/W3103786587","https://openalex.org/W3105385534","https://openalex.org/W3125811491","https://openalex.org/W4211007733","https://openalex.org/W4231934124","https://openalex.org/W4236703367","https://openalex.org/W4249962242","https://openalex.org/W4285719527","https://openalex.org/W4298432362","https://openalex.org/W4300323401","https://openalex.org/W4304686742","https://openalex.org/W4376608133","https://openalex.org/W6816317740"],"related_works":["https://openalex.org/W4317939968","https://openalex.org/W2895820280","https://openalex.org/W1987570032","https://openalex.org/W2580842864","https://openalex.org/W1964850218","https://openalex.org/W3021169926","https://openalex.org/W2123011400","https://openalex.org/W1544451817","https://openalex.org/W4236413566","https://openalex.org/W2589174435"],"abstract_inverted_index":{"Several":[0],"properties":[1,161],"of":[2,34,39,66,106,130,147,182],"information":[3],"retrieval":[4],"(IR)":[5],"data,":[6],"such":[7,40],"as":[8,21],"query":[9,89,91,142],"frequency":[10,143,150],"or":[11,46,174,204],"document":[12,87],"length,":[13,88,92],"are":[14,152,162],"widely":[15],"considered":[16],"to":[17,29,133,192,198],"be":[18,55,193],"approximately":[19],"distributed":[20],"a":[22,156],"power":[23,67,80,110,131,157,184],"law.":[24,158],"This":[25,50],"common":[26],"assumption":[27],"aims":[28],"focus":[30],"on":[31],"specific":[32],"characteristics":[33],"the":[35,63,103,128,166,180],"empirical":[36],"probability":[37,137],"distribution":[38,116,190],"data":[41],"(e.g.,":[42],"its":[43,47],"scale-free":[44],"nature":[45],"long/fat":[48],"tail).":[49],"assumption,":[51],"however,":[52],"may":[53],"not":[54],"always":[56],"true.":[57],"Motivated":[58],"by":[59,155,165,187],"recent":[60],"work":[61],"in":[62],"statistical":[64],"treatment":[65],"law":[68,81,111,185],"claims,":[69],"we":[70],"investigate":[71],"two":[72],"research":[73],"questions:":[74],"(i)":[75],"To":[76],"what":[77,101],"extent":[78],"do":[79],"approximations":[82,112,186],"hold":[83],"for":[84,208],"term":[85,149],"frequency,":[86,90,94],"citation":[93],"and":[95,122,126,144],"syntactic":[96],"unigram":[97],"frequency?":[98],"And":[99],"(ii)":[100],"is":[102],"computational":[104],"cost":[105],"replacing":[107,183],"ad":[108],"hoc":[109],"with":[113,195],"more":[114,188],"accurate":[115],"fitting?":[117],"We":[118,139,177],"study":[119],"23":[120],"TREC":[121],"5":[123,145],"non-TREC":[124],"datasets":[125],"compare":[127],"fit":[129],"laws":[132],"15":[134],"other":[135],"standard":[136],"distributions.":[138],"find":[140,179],"that":[141],"out":[146],"24":[148],"distributions":[151],"best":[153],"approximated":[154,164],"All":[159],"remaining":[160],"better":[163],"Inverse":[167],"Gaussian,":[168],"Generalized":[169],"Extreme":[170],"Value,":[171],"Negative":[172],"Binomial,":[173],"Yule":[175],"distribution.":[176],"also":[178],"overhead":[181],"informed":[189],"fitting":[191],"negligible,":[194],"potential":[196],"gains":[197],"IR":[199,209],"tasks":[200],"like":[201],"index":[202],"compression":[203],"test":[205],"collection":[206],"generation":[207],"evaluation.":[210]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":5},{"year":2020,"cited_by_count":6},{"year":2019,"cited_by_count":12},{"year":2018,"cited_by_count":4},{"year":2017,"cited_by_count":4},{"year":2016,"cited_by_count":5}],"updated_date":"2026-03-15T09:29:46.208133","created_date":"2025-10-10T00:00:00"}
