{"id":"https://openalex.org/W1965906558","doi":"https://doi.org/10.1145/1008992.1009088","title":"The document as an ergodic markov chain","display_name":"The document as an ergodic markov chain","publication_year":2004,"publication_date":"2004-07-25","ids":{"openalex":"https://openalex.org/W1965906558","doi":"https://doi.org/10.1145/1008992.1009088","mag":"1965906558"},"language":"en","primary_location":{"id":"doi:10.1145/1008992.1009088","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1008992.1009088","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 27th annual international ACM SIGIR conference on Research and development in information retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5111794960","display_name":"Eduard Hoenkamp","orcid":null},"institutions":[{"id":"https://openalex.org/I4210114752","display_name":"Nijmegen Institute for Scientist Practitioners in Addiction","ror":"https://ror.org/01ydthg97","country_code":"NL","type":"other","lineage":["https://openalex.org/I4210114752"]}],"countries":["NL"],"is_corresponding":true,"raw_author_name":"Eduard Hoenkamp","raw_affiliation_strings":["Nijmegen Institute for Cognition and Information, The Netherlands"],"affiliations":[{"raw_affiliation_string":"Nijmegen Institute for Cognition and Information, The Netherlands","institution_ids":["https://openalex.org/I4210114752"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5050532724","display_name":"Dawei Song","orcid":"https://orcid.org/0000-0002-8660-3608"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dawei Song","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5111794960"],"corresponding_institution_ids":["https://openalex.org/I4210114752"],"apc_list":null,"apc_paid":null,"fwci":0.4625,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.74569843,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"496","last_page":"497"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/ergodic-theory","display_name":"Ergodic theory","score":0.7679276466369629},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7377973794937134},{"id":"https://openalex.org/keywords/markov-chain","display_name":"Markov chain","score":0.6058933138847351},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.5337648391723633},{"id":"https://openalex.org/keywords/joint-probability-distribution","display_name":"Joint probability distribution","score":0.5159743428230286},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5019829273223877},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.4139566719532013},{"id":"https://openalex.org/keywords/probability-distribution","display_name":"Probability distribution","score":0.4121879041194916},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3750971257686615},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.32244452834129333},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.23283711075782776},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.20847636461257935},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.13157129287719727},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.09978687763214111}],"concepts":[{"id":"https://openalex.org/C122044880","wikidata":"https://www.wikidata.org/wiki/Q5498822","display_name":"Ergodic theory","level":2,"score":0.7679276466369629},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7377973794937134},{"id":"https://openalex.org/C98763669","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov chain","level":2,"score":0.6058933138847351},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.5337648391723633},{"id":"https://openalex.org/C18653775","wikidata":"https://www.wikidata.org/wiki/Q1333358","display_name":"Joint probability distribution","level":2,"score":0.5159743428230286},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5019829273223877},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.4139566719532013},{"id":"https://openalex.org/C149441793","wikidata":"https://www.wikidata.org/wiki/Q200726","display_name":"Probability distribution","level":2,"score":0.4121879041194916},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3750971257686615},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.32244452834129333},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.23283711075782776},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.20847636461257935},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.13157129287719727},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.09978687763214111},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1145/1008992.1009088","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1008992.1009088","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 27th annual international ACM SIGIR conference on Research and development in information retrieval","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.96.7003","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.96.7003","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://kmi.open.ac.uk/people/dawei/papers/hoenkamp-song-sigir04.pdf","raw_type":"text"},{"id":"pmh:oai:espace.library.uq.edu.au:UQ:22283d8","is_oa":false,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4306402388","display_name":"Queensland's institutional digital repository (The University of Queensland)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I165143802","host_organization_name":"The University of Queensland","host_organization_lineage":["https://openalex.org/I165143802"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Conference Paper"},{"id":"pmh:ru:oai:repository.ubn.ru.nl:2066/64542","is_oa":false,"landing_page_url":"http://hdl.handle.net/2066/64542","pdf_url":null,"source":{"id":"https://openalex.org/S4306401843","display_name":"Data Archiving and Networked Services (DANS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1322597698","host_organization_name":"Royal Netherlands Academy of Arts and Sciences","host_organization_lineage":["https://openalex.org/I1322597698"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Proceedings 27th Annual International ACM SIGIR Conference on Research and Development in Information Retrieval, 496 - 497. New York : ACM Press","raw_type":"info:eu-repo/semantics/bookpart"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":6,"referenced_works":["https://openalex.org/W1482214997","https://openalex.org/W2008480878","https://openalex.org/W2068905009","https://openalex.org/W2154344566","https://openalex.org/W4243333943","https://openalex.org/W4300973511"],"related_works":["https://openalex.org/W2379651310","https://openalex.org/W1987264987","https://openalex.org/W2113019827","https://openalex.org/W1541249122","https://openalex.org/W2951801950","https://openalex.org/W4297670780","https://openalex.org/W2413828414","https://openalex.org/W1482189126","https://openalex.org/W2367222340","https://openalex.org/W2122857041"],"abstract_inverted_index":{"In":[0],"recent":[1],"years,":[2],"statistical":[3],"language":[4,19,113],"models":[5,36],"are":[6],"being":[7],"proposed":[8],"as":[9,18,39],"alternative":[10],"to":[11,59],"the":[12,22,31,40,68,85,99,102,105],"vector":[13],"space":[14],"model.":[15],"Viewing":[16],"documents":[17],"samples":[20],"introduces":[21],"issue":[23],"of":[24,42,104],"defining":[25],"a":[26,37,43,109],"joint":[27,69],"probability":[28],"distribution":[29,70],"over":[30],"terms.":[32],"The":[33,63],"present":[34],"paper":[35],"document":[38,86],"result":[41,65],"Markov":[44],"process.":[45],"It":[46],"argues":[47],"that":[48,67],"this":[49,90],"process":[50],"is":[51,54,66],"ergodic,":[52],"which":[53],"theoretically":[55],"plausible,":[56],"and":[57,101],"easy":[58],"verify":[60],"in":[61,91],"practice.":[62],"theoretical":[64],"can":[71,76],"be":[72,78],"easily":[73],"obtained.":[74],"This":[75,107],"also":[77],"applied":[79],"for":[80,111],"search":[81],"resolutions":[82],"other":[83],"than":[84],"level.":[87],"We":[88],"verified":[89],"an":[92],"experiment":[93],"on":[94],"query":[95],"expansion":[96],"demonstrating":[97],"both":[98],"validity":[100],"practicability":[103],"method.":[106],"holds":[108],"promise":[110],"general":[112],"models.":[114]},"counts_by_year":[{"year":2013,"cited_by_count":1},{"year":2012,"cited_by_count":2}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
