{"id":"https://openalex.org/W2136530748","doi":"https://doi.org/10.1177/0165551511415183","title":"A prediction model for web search hit counts using word frequencies","display_name":"A prediction model for web search hit counts using word frequencies","publication_year":2011,"publication_date":"2011-07-29","ids":{"openalex":"https://openalex.org/W2136530748","doi":"https://doi.org/10.1177/0165551511415183","mag":"2136530748"},"language":"en","primary_location":{"id":"doi:10.1177/0165551511415183","is_oa":false,"landing_page_url":"https://doi.org/10.1177/0165551511415183","pdf_url":null,"source":{"id":"https://openalex.org/S68913162","display_name":"Journal of Information Science","issn_l":"0165-5515","issn":["0165-5515","1741-6485"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Information Science","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100419134","display_name":"Tian Tian","orcid":"https://orcid.org/0000-0002-9021-7996"},"institutions":[{"id":"https://openalex.org/I118118575","display_name":"New Jersey Institute of Technology","ror":"https://ror.org/05e74xb87","country_code":"US","type":"education","lineage":["https://openalex.org/I118118575"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Tian Tian","raw_affiliation_strings":["New Jersey Institute of Technology, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"New Jersey Institute of Technology, USA","institution_ids":["https://openalex.org/I118118575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036705478","display_name":"Soon Ae Chun","orcid":null},"institutions":[{"id":"https://openalex.org/I174216632","display_name":"City University of New York","ror":"https://ror.org/00453a208","country_code":"US","type":"education","lineage":["https://openalex.org/I174216632"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Soon Ae Chun","raw_affiliation_strings":["City University of New York, USA","CITY UNIVERSITY OF NEW YORK, USA,"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"City University of New York, USA","institution_ids":["https://openalex.org/I174216632"]},{"raw_affiliation_string":"CITY UNIVERSITY OF NEW YORK, USA,","institution_ids":["https://openalex.org/I174216632"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5070654032","display_name":"James Geller","orcid":"https://orcid.org/0000-0002-9120-525X"},"institutions":[{"id":"https://openalex.org/I118118575","display_name":"New Jersey Institute of Technology","ror":"https://ror.org/05e74xb87","country_code":"US","type":"education","lineage":["https://openalex.org/I118118575"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"James Geller","raw_affiliation_strings":["New Jersey Institute of Technology, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"New Jersey Institute of Technology, USA","institution_ids":["https://openalex.org/I118118575"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100419134"],"corresponding_institution_ids":["https://openalex.org/I118118575"],"apc_list":null,"apc_paid":null,"fwci":0.7639,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.84116059,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":"37","issue":"5","first_page":"462","last_page":"475"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13976","display_name":"Web visibility and informetrics","score":0.992900013923645,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10064","display_name":"Complex Network Analysis Techniques","score":0.9825999736785889,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7998969554901123},{"id":"https://openalex.org/keywords/search-engine","display_name":"Search engine","score":0.7910147309303284},{"id":"https://openalex.org/keywords/web-search-query","display_name":"Web search query","score":0.7191485166549683},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.7167112827301025},{"id":"https://openalex.org/keywords/search-analytics","display_name":"Search analytics","score":0.5195111036300659},{"id":"https://openalex.org/keywords/metasearch-engine","display_name":"Metasearch engine","score":0.5077751278877258},{"id":"https://openalex.org/keywords/online-search","display_name":"Online search","score":0.48919156193733215},{"id":"https://openalex.org/keywords/web-search-engine","display_name":"Web search engine","score":0.46869516372680664},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.4565112888813019},{"id":"https://openalex.org/keywords/string","display_name":"String (physics)","score":0.43447020649909973},{"id":"https://openalex.org/keywords/semantic-search","display_name":"Semantic search","score":0.4222361445426941},{"id":"https://openalex.org/keywords/web-query-classification","display_name":"Web query classification","score":0.4212181568145752},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.34784531593322754},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.08452323079109192}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7998969554901123},{"id":"https://openalex.org/C97854310","wikidata":"https://www.wikidata.org/wiki/Q19541","display_name":"Search engine","level":2,"score":0.7910147309303284},{"id":"https://openalex.org/C164120249","wikidata":"https://www.wikidata.org/wiki/Q995982","display_name":"Web search query","level":3,"score":0.7191485166549683},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.7167112827301025},{"id":"https://openalex.org/C14838553","wikidata":"https://www.wikidata.org/wiki/Q7441639","display_name":"Search analytics","level":4,"score":0.5195111036300659},{"id":"https://openalex.org/C173979980","wikidata":"https://www.wikidata.org/wiki/Q114106","display_name":"Metasearch engine","level":4,"score":0.5077751278877258},{"id":"https://openalex.org/C171089853","wikidata":"https://www.wikidata.org/wiki/Q7094123","display_name":"Online search","level":2,"score":0.48919156193733215},{"id":"https://openalex.org/C521815418","wikidata":"https://www.wikidata.org/wiki/Q4182287","display_name":"Web search engine","level":4,"score":0.46869516372680664},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.4565112888813019},{"id":"https://openalex.org/C157486923","wikidata":"https://www.wikidata.org/wiki/Q1376436","display_name":"String (physics)","level":2,"score":0.43447020649909973},{"id":"https://openalex.org/C166423231","wikidata":"https://www.wikidata.org/wiki/Q1891170","display_name":"Semantic search","level":3,"score":0.4222361445426941},{"id":"https://openalex.org/C118689300","wikidata":"https://www.wikidata.org/wiki/Q7978614","display_name":"Web query classification","level":4,"score":0.4212181568145752},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.34784531593322754},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.08452323079109192},{"id":"https://openalex.org/C37914503","wikidata":"https://www.wikidata.org/wiki/Q156495","display_name":"Mathematical physics","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1177/0165551511415183","is_oa":false,"landing_page_url":"https://doi.org/10.1177/0165551511415183","pdf_url":null,"source":{"id":"https://openalex.org/S68913162","display_name":"Journal of Information Science","issn_l":"0165-5515","issn":["0165-5515","1741-6485"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Information Science","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":49,"referenced_works":["https://openalex.org/W1410460","https://openalex.org/W48178473","https://openalex.org/W82021493","https://openalex.org/W148019605","https://openalex.org/W187070286","https://openalex.org/W563169923","https://openalex.org/W594521162","https://openalex.org/W1500720541","https://openalex.org/W1501882636","https://openalex.org/W1509699184","https://openalex.org/W1560709708","https://openalex.org/W1570448133","https://openalex.org/W1604007790","https://openalex.org/W1636492622","https://openalex.org/W1662723021","https://openalex.org/W1865453863","https://openalex.org/W1880247114","https://openalex.org/W1928755576","https://openalex.org/W1994151493","https://openalex.org/W1997612355","https://openalex.org/W2032253055","https://openalex.org/W2037959956","https://openalex.org/W2046725473","https://openalex.org/W2053782355","https://openalex.org/W2073002952","https://openalex.org/W2079656678","https://openalex.org/W2095368471","https://openalex.org/W2099437808","https://openalex.org/W2103052078","https://openalex.org/W2107972503","https://openalex.org/W2112888549","https://openalex.org/W2121494450","https://openalex.org/W2122946987","https://openalex.org/W2124416056","https://openalex.org/W2128941908","https://openalex.org/W2133322356","https://openalex.org/W2136583886","https://openalex.org/W2142233082","https://openalex.org/W2158606791","https://openalex.org/W2169598467","https://openalex.org/W2171970775","https://openalex.org/W2346435300","https://openalex.org/W2618567416","https://openalex.org/W2966207845","https://openalex.org/W3013264884","https://openalex.org/W4235015211","https://openalex.org/W4248184695","https://openalex.org/W4250708312","https://openalex.org/W4285719527"],"related_works":["https://openalex.org/W4206776910","https://openalex.org/W2262062475","https://openalex.org/W2183410680","https://openalex.org/W2154792254","https://openalex.org/W4256136669","https://openalex.org/W2115429408","https://openalex.org/W2538203441","https://openalex.org/W1132511467","https://openalex.org/W2186487484","https://openalex.org/W2136530748"],"abstract_inverted_index":{"A":[0],"search":[1,30,96,115,126,142,158,172,182],"engine":[2,97],"user":[3],"with":[4],"a":[5,18,75,86,130],"well-defined":[6],"information":[7],"need":[8,32],"is":[9],"not":[10],"interested":[11],"in":[12,113],"getting":[13],"thousands":[14,63],"of":[15,67,95,110,125,149],"hits,":[16],"but":[17],"few":[19],"hits":[20,54,98],"that":[21],"are":[22],"all":[23],"highly":[24],"relevant":[25,43],"to":[26,33,38,41,52,62,139],"their":[27],"search.":[28],"Often":[29],"words":[31,112],"be":[34,137],"refined":[35],"and":[36,84,163,170,180],"augmented":[37],"narrow":[39],"results":[40],"more":[42],"pages.":[44],"However,":[45],"an":[46,146],"overly":[47],"specific":[48],"query":[49,76,82,102,134],"may":[50],"lead":[51,61],"no":[53],"at":[55],"all,":[56],"while":[57],"most":[58],"typical":[59],"queries":[60],"or":[64],"even":[65],"millions":[66],"them,":[68],"both":[69],"undesirable":[70],"outcomes.":[71],"This":[72],"paper":[73],"suggests":[74],"rewriting":[77],"method":[78],"for":[79,91,99,155],"generating":[80],"alternative":[81,101],"strings":[83],"proposes":[85],"hit":[87,119,132,151],"count":[88,120,133,152],"prediction":[89,121,153],"model":[90,154],"predicting":[92],"the":[93,106,111,114,118,150,167],"number":[94],"each":[100],"string,":[103],"based":[104],"on":[105],"English":[107],"language":[108],"frequencies":[109],"terms.":[116],"Using":[117],"model,":[122],"different":[123],"types":[124],"strategies,":[127],"such":[128],"as":[129],"lowest":[131],"preference,":[135],"can":[136],"utilized":[138],"improve":[140],"users\u2019":[141],"experience.":[143],"We":[144,160],"present":[145],"evaluation":[147],"experiment":[148],"three":[156],"major":[157],"engines.":[159],"also":[161],"discuss":[162],"quantify":[164],"how":[165],"far":[166],"Google,":[168],"Yahoo!":[169],"Bing":[171],"engines":[173],"diverge":[174],"from":[175],"monotonic":[176],"behaviour,":[177],"considering":[178],"negative":[179],"positive":[181],"terms":[183],"separately.":[184]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2015,"cited_by_count":2},{"year":2012,"cited_by_count":1}],"updated_date":"2026-05-05T06:06:40.768181","created_date":"2025-10-10T00:00:00"}
