{"id":"https://openalex.org/W2339184484","doi":"https://doi.org/10.1145/2872427.2882981","title":"N-gram over Context","display_name":"N-gram over Context","publication_year":2016,"publication_date":"2016-04-11","ids":{"openalex":"https://openalex.org/W2339184484","doi":"https://doi.org/10.1145/2872427.2882981","mag":"2339184484"},"language":"en","primary_location":{"id":"doi:10.1145/2872427.2882981","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2872427.2882981","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 25th International Conference on World Wide Web","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5070142351","display_name":"Noriaki Kawamae","orcid":"https://orcid.org/0000-0002-0746-9624"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Noriaki Kawamae","raw_affiliation_strings":["NTT Comware, Chiba, Japan"],"affiliations":[{"raw_affiliation_string":"NTT Comware, Chiba, Japan","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5070142351"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.7139,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.88586227,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1045","last_page":"1055"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9954000115394592,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9934999942779541,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/gram","display_name":"Gram","score":0.6092544794082642},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.596348226070404},{"id":"https://openalex.org/keywords/n-gram","display_name":"n-gram","score":0.5834430456161499},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5530784130096436},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.15616923570632935},{"id":"https://openalex.org/keywords/history","display_name":"History","score":0.08608436584472656},{"id":"https://openalex.org/keywords/geology","display_name":"Geology","score":0.08344605565071106}],"concepts":[{"id":"https://openalex.org/C161369605","wikidata":"https://www.wikidata.org/wiki/Q41803","display_name":"Gram","level":3,"score":0.6092544794082642},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.596348226070404},{"id":"https://openalex.org/C117884012","wikidata":"https://www.wikidata.org/wiki/Q94489","display_name":"n-gram","level":3,"score":0.5834430456161499},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5530784130096436},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.15616923570632935},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.08608436584472656},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.08344605565071106},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C523546767","wikidata":"https://www.wikidata.org/wiki/Q10876","display_name":"Bacteria","level":2,"score":0.0},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2872427.2882981","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2872427.2882981","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 25th International Conference on World Wide Web","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.44999998807907104,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":35,"referenced_works":["https://openalex.org/W27793324","https://openalex.org/W263845233","https://openalex.org/W1609010894","https://openalex.org/W1712618182","https://openalex.org/W1878153963","https://openalex.org/W1880262756","https://openalex.org/W1967465043","https://openalex.org/W1972444686","https://openalex.org/W1985125789","https://openalex.org/W2003899488","https://openalex.org/W2005564522","https://openalex.org/W2015706532","https://openalex.org/W2037959956","https://openalex.org/W2041517243","https://openalex.org/W2042980227","https://openalex.org/W2047756776","https://openalex.org/W2061873838","https://openalex.org/W2067002391","https://openalex.org/W2069429561","https://openalex.org/W2080972498","https://openalex.org/W2087309226","https://openalex.org/W2087863196","https://openalex.org/W2104210067","https://openalex.org/W2112971401","https://openalex.org/W2116137244","https://openalex.org/W2132827946","https://openalex.org/W2141441158","https://openalex.org/W2150286230","https://openalex.org/W2151967501","https://openalex.org/W2154099718","https://openalex.org/W2158266063","https://openalex.org/W3003241580","https://openalex.org/W6637370413","https://openalex.org/W6651763111","https://openalex.org/W6676893574"],"related_works":["https://openalex.org/W2906970013","https://openalex.org/W3126081632","https://openalex.org/W2959686711","https://openalex.org/W2747014888","https://openalex.org/W2088254117","https://openalex.org/W3033292598","https://openalex.org/W2790860321","https://openalex.org/W2955248800","https://openalex.org/W3084943335","https://openalex.org/W27703600"],"abstract_inverted_index":{"Our":[0],"proposal,":[1],"$N$-gram":[2,100],"over":[3,158],"Context":[4],"(NOC),":[5],"is":[6,179],"a":[7,18,38,56,81,93,123,127,152,162,182],"nonparametric":[8],"topic":[9,31,57,76,110,189],"model":[10,184,214],"that":[11,85,177],"aims":[12],"to":[13,24,150,167,185],"help":[14,218],"our":[15],"understanding":[16],"of":[17,40,75,83,143,219],"given":[19,94,124],"corpus,":[20],"and":[21,42,64,98,155,191,195,200],"be":[22],"applied":[23],"many":[25],"text":[26],"mining":[27],"applications.":[28],"Like":[29],"other":[30],"models,":[32,51],"NOC":[33,52,79,119,146,178],"represents":[34],"each":[35,44,144,148],"document":[36,149],"as":[37,59,66,96,181],"mixture":[39],"topics":[41,84,91],"generates":[43],"word":[45,106,137],"from":[46,92,122],"one":[47],"topic.":[48],"Unlike":[49],"these":[50,115],"focuses":[53],"on":[54,108,173],"both":[55,114,187],"structure":[58,190],"an":[60,67,220],"internal":[61],"linguistic":[62,69,116],"structure,":[63],"N-gram":[65],"external":[68],"structure.":[70],"To":[71,112],"improve":[72],"the":[73,87,136,140,188,192,217],"quality":[74],"specific":[77,202],"N-grams,":[78,194],"reveals":[80],"tree":[82,134],"captures":[86],"semantic":[88],"relationship":[89],"between":[90],"corpus":[95,125],"context,":[97],"forms":[99],"by":[101,216],"offering":[102],"power-law":[103],"distributions":[104],"for":[105],"frequencies":[107],"this":[109,132],"tree.":[111],"gain":[113],"structures":[117],"efficiently,":[118],"learns":[120],"them":[121],"in":[126,139],"unified":[128],"manner.":[129],"By":[130],"accessing":[131],"entire":[133],"at":[135],"level":[138],"generative":[141,183,213],"process":[142,206],"document,":[145],"enables":[147],"maintain":[151],"thematic":[153],"coherence":[154],"form":[156],"$N$-grams":[157],"context.":[159],"We":[160],"develop":[161],"parallelizable":[163],"inference":[164],"algorithm,":[165],"D-NOC,":[166],"support":[168],"large":[169,207],"data":[170,208],"sets.":[171],"Experiments":[172],"review":[174],"articles/papers/tweet":[175],"show":[176],"useful":[180],"discover":[186],"corresponding":[193],"well":[196],"complements":[197],"human":[198],"experts":[199],"domain":[201],"knowledge.":[203],"D-NOC":[204],"can":[205],"sets":[209],"while":[210],"preserving":[211],"full":[212],"performance,":[215],"open-source":[221],"distributed":[222],"machine":[223],"learning":[224],"framework.":[225]},"counts_by_year":[{"year":2021,"cited_by_count":1},{"year":2019,"cited_by_count":2},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
