{"id":"https://openalex.org/W2147057843","doi":"https://doi.org/10.1145/1571941.1571981","title":"Building enriched document representations using aggregated anchor text","display_name":"Building enriched document representations using aggregated anchor text","publication_year":2009,"publication_date":"2009-07-19","ids":{"openalex":"https://openalex.org/W2147057843","doi":"https://doi.org/10.1145/1571941.1571981","mag":"2147057843"},"language":"en","primary_location":{"id":"doi:10.1145/1571941.1571981","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1571941.1571981","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd international ACM SIGIR conference on Research and development in information retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5000115067","display_name":"Donald Metzler","orcid":"https://orcid.org/0000-0003-4276-6269"},"institutions":[{"id":"https://openalex.org/I4210134091","display_name":"Yahoo (United States)","ror":"https://ror.org/040dkzz12","country_code":"US","type":"company","lineage":["https://openalex.org/I4210134091"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Donald Metzler","raw_affiliation_strings":["Yahoo! Labs, Santa Clara, CA, USA","Yahoo! Labs., Santa Clara, CA, USA#TAB#"],"affiliations":[{"raw_affiliation_string":"Yahoo! Labs, Santa Clara, CA, USA","institution_ids":["https://openalex.org/I4210134091"]},{"raw_affiliation_string":"Yahoo! Labs., Santa Clara, CA, USA#TAB#","institution_ids":["https://openalex.org/I4210134091"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040195075","display_name":"Jasmine Novak","orcid":null},"institutions":[{"id":"https://openalex.org/I4210134091","display_name":"Yahoo (United States)","ror":"https://ror.org/040dkzz12","country_code":"US","type":"company","lineage":["https://openalex.org/I4210134091"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jasmine Novak","raw_affiliation_strings":["Yahoo! Labs, Santa Clara, CA, USA","Yahoo! Labs., Santa Clara, CA, USA#TAB#"],"affiliations":[{"raw_affiliation_string":"Yahoo! Labs, Santa Clara, CA, USA","institution_ids":["https://openalex.org/I4210134091"]},{"raw_affiliation_string":"Yahoo! Labs., Santa Clara, CA, USA#TAB#","institution_ids":["https://openalex.org/I4210134091"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110375654","display_name":"Hang Cui","orcid":"https://orcid.org/0000-0002-0987-3743"},"institutions":[{"id":"https://openalex.org/I4210134091","display_name":"Yahoo (United States)","ror":"https://ror.org/040dkzz12","country_code":"US","type":"company","lineage":["https://openalex.org/I4210134091"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hang Cui","raw_affiliation_strings":["Yahoo! Labs, Santa Clara, CA, USA","Yahoo! Labs., Santa Clara, CA, USA#TAB#"],"affiliations":[{"raw_affiliation_string":"Yahoo! Labs, Santa Clara, CA, USA","institution_ids":["https://openalex.org/I4210134091"]},{"raw_affiliation_string":"Yahoo! Labs., Santa Clara, CA, USA#TAB#","institution_ids":["https://openalex.org/I4210134091"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103551629","display_name":"Srihari Reddy","orcid":null},"institutions":[{"id":"https://openalex.org/I4210134091","display_name":"Yahoo (United States)","ror":"https://ror.org/040dkzz12","country_code":"US","type":"company","lineage":["https://openalex.org/I4210134091"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Srihari Reddy","raw_affiliation_strings":["Yahoo! Labs, Santa Clara, CA, USA","Yahoo! Labs., Santa Clara, CA, USA#TAB#"],"affiliations":[{"raw_affiliation_string":"Yahoo! Labs, Santa Clara, CA, USA","institution_ids":["https://openalex.org/I4210134091"]},{"raw_affiliation_string":"Yahoo! Labs., Santa Clara, CA, USA#TAB#","institution_ids":["https://openalex.org/I4210134091"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5000115067"],"corresponding_institution_ids":["https://openalex.org/I4210134091"],"apc_list":null,"apc_paid":null,"fwci":25.618,"has_fulltext":false,"cited_by_count":65,"citation_normalized_percentile":{"value":0.99404158,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"219","last_page":"226"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/hyperlink","display_name":"Hyperlink","score":0.8623765707015991},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8157120943069458},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.7041497826576233},{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.5343913435935974},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5298057794570923},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.4847145080566406},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.47722938656806946},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.46049028635025024},{"id":"https://openalex.org/keywords/web-page","display_name":"Web page","score":0.41515469551086426},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.1858171820640564},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.12299981713294983}],"concepts":[{"id":"https://openalex.org/C30088001","wikidata":"https://www.wikidata.org/wiki/Q102014","display_name":"Hyperlink","level":3,"score":0.8623765707015991},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8157120943069458},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.7041497826576233},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.5343913435935974},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5298057794570923},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.4847145080566406},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.47722938656806946},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.46049028635025024},{"id":"https://openalex.org/C21959979","wikidata":"https://www.wikidata.org/wiki/Q36774","display_name":"Web page","level":2,"score":0.41515469551086426},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.1858171820640564},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.12299981713294983},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/1571941.1571981","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1571941.1571981","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd international ACM SIGIR conference on Research and development in information retrieval","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.152.4053","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.152.4053","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://ciir.cs.umass.edu/~metzler/fp094-metzler.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.6499999761581421}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W60779023","https://openalex.org/W131411689","https://openalex.org/W179016587","https://openalex.org/W1984681168","https://openalex.org/W2014415866","https://openalex.org/W2027445772","https://openalex.org/W2047221353","https://openalex.org/W2060494110","https://openalex.org/W2066636486","https://openalex.org/W2067802667","https://openalex.org/W2069870183","https://openalex.org/W2070740689","https://openalex.org/W2077122984","https://openalex.org/W2078396654","https://openalex.org/W2083745421","https://openalex.org/W2085030399","https://openalex.org/W2087818911","https://openalex.org/W2089199911","https://openalex.org/W2096772800","https://openalex.org/W2108652674","https://openalex.org/W2114811871","https://openalex.org/W2124658502","https://openalex.org/W2129971563","https://openalex.org/W2130395434","https://openalex.org/W2138621811","https://openalex.org/W2143331230","https://openalex.org/W2146907956","https://openalex.org/W2147872511","https://openalex.org/W2154884126","https://openalex.org/W2158201212","https://openalex.org/W2162432120","https://openalex.org/W2175110005","https://openalex.org/W2221667243","https://openalex.org/W2496948131","https://openalex.org/W6602511761","https://openalex.org/W6603897584","https://openalex.org/W6605300326","https://openalex.org/W6669996083"],"related_works":["https://openalex.org/W2245616560","https://openalex.org/W2351804282","https://openalex.org/W2048998278","https://openalex.org/W1556894713","https://openalex.org/W2382071381","https://openalex.org/W1490416172","https://openalex.org/W158130761","https://openalex.org/W2588706232","https://openalex.org/W2096877906","https://openalex.org/W2351292080"],"abstract_inverted_index":{"It":[0,29],"is":[1,30],"well":[2],"known":[3],"that":[4,83],"anchor":[5,44,73,81,99],"text":[6,45,74,82,100],"plays":[7],"a":[8,12,35,69,102,111],"critical":[9],"role":[10],"in":[11],"variety":[13],"of":[14,42],"search":[15,114],"tasks":[16],"performed":[17],"over":[18],"hypertextual":[19],"domains,":[20],"including":[21],"enterprise":[22],"search,":[23,25],"wiki":[24],"and":[26],"web":[27,113],"search.":[28],"common":[31],"practice":[32],"to":[33,95],"enrich":[34],"document's":[36],"standard":[37],"textual":[38],"representation":[39],"with":[40,47,60,80],"all":[41],"the":[43,88,120],"associated":[46],"its":[48],"incoming":[49],"hyperlinks.":[50],"However,":[51],"this":[52,65],"approach":[53,109,121],"does":[54],"not":[55],"help":[56],"match":[57],"relevant":[58],"pages":[59],"very":[61],"few":[62],"inlinks.":[63],"In":[64],"paper,":[66],"we":[67],"propose":[68],"method":[70],"for":[71,127],"overcoming":[72],"sparsity":[75],"by":[76],"enriching":[77],"document":[78],"representations":[79],"has":[84],"been":[85],"aggregated":[86],"across":[87],"hyperlink":[89],"graph.":[90],"This":[91],"aggregation":[92],"mechanism":[93],"acts":[94],"smooth,":[96],"or":[97],"diffuse,":[98],"within":[101],"domain.":[103],"We":[104],"rigorously":[105],"evaluate":[106],"our":[107],"proposed":[108],"on":[110],"large":[112],"test":[115],"collection.":[116],"Our":[117],"results":[118],"show":[119],"significantly":[122],"improves":[123],"retrieval":[124],"effectiveness,":[125],"especially":[126],"longer,":[128],"more":[129],"difficult":[130],"queries.":[131]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":4},{"year":2015,"cited_by_count":6},{"year":2014,"cited_by_count":5},{"year":2013,"cited_by_count":6},{"year":2012,"cited_by_count":10}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
