{"id":"https://openalex.org/W2166183437","doi":"https://doi.org/10.1198/004017007000000245","title":"Large-Scale Bayesian Logistic Regression for Text Categorization","display_name":"Large-Scale Bayesian Logistic Regression for Text Categorization","publication_year":2007,"publication_date":"2007-07-19","ids":{"openalex":"https://openalex.org/W2166183437","doi":"https://doi.org/10.1198/004017007000000245","mag":"2166183437"},"language":"en","primary_location":{"id":"doi:10.1198/004017007000000245","is_oa":false,"landing_page_url":"https://doi.org/10.1198/004017007000000245","pdf_url":null,"source":{"id":"https://openalex.org/S985303","display_name":"Technometrics","issn_l":"0040-1706","issn":["0040-1706","1537-2723"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320547","host_organization_name":"Taylor & Francis","host_organization_lineage":["https://openalex.org/P4310320547"],"host_organization_lineage_names":["Taylor & Francis"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Technometrics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5082142377","display_name":"Alexander Genkin","orcid":"https://orcid.org/0000-0002-0716-1304"},"institutions":[{"id":"https://openalex.org/I102322142","display_name":"Rutgers, The State University of New Jersey","ror":"https://ror.org/05vt9qd57","country_code":"US","type":"education","lineage":["https://openalex.org/I102322142"]},{"id":"https://openalex.org/I2799411422","display_name":"Center for Discrete Mathematics and Theoretical Computer Science","ror":"https://ror.org/00k551w06","country_code":"US","type":"facility","lineage":["https://openalex.org/I102322142","https://openalex.org/I118347220","https://openalex.org/I1283103587","https://openalex.org/I1311060795","https://openalex.org/I20089843","https://openalex.org/I2799411422","https://openalex.org/I4210107353"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Alexander Genkin","raw_affiliation_strings":["DIMACS, Rutgers University, Piscataway, NJ 08854"],"affiliations":[{"raw_affiliation_string":"DIMACS, Rutgers University, Piscataway, NJ 08854","institution_ids":["https://openalex.org/I2799411422","https://openalex.org/I102322142"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020081385","display_name":"David Lewis","orcid":"https://orcid.org/0000-0002-3503-4644"},"institutions":[{"id":"https://openalex.org/I4210148173","display_name":"Morgan, Lewis & Bockius (United States)","ror":"https://ror.org/04c0z3e83","country_code":"US","type":"company","lineage":["https://openalex.org/I4210148173"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"David D Lewis","raw_affiliation_strings":["David D. Lewis Consulting, Chicago, IL 60614"],"affiliations":[{"raw_affiliation_string":"David D. Lewis Consulting, Chicago, IL 60614","institution_ids":["https://openalex.org/I4210148173"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5018667469","display_name":"David Madigan","orcid":"https://orcid.org/0000-0001-9754-1011"},"institutions":[{"id":"https://openalex.org/I102322142","display_name":"Rutgers, The State University of New Jersey","ror":"https://ror.org/05vt9qd57","country_code":"US","type":"education","lineage":["https://openalex.org/I102322142"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"David Madigan","raw_affiliation_strings":["Dept. of Statistics, Rutgers University, Piscataway, NJ 08854"],"affiliations":[{"raw_affiliation_string":"Dept. of Statistics, Rutgers University, Piscataway, NJ 08854","institution_ids":["https://openalex.org/I102322142"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5082142377"],"corresponding_institution_ids":["https://openalex.org/I102322142","https://openalex.org/I2799411422"],"apc_list":null,"apc_paid":null,"fwci":73.9961,"has_fulltext":false,"cited_by_count":817,"citation_normalized_percentile":{"value":0.99953096,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":100},"biblio":{"volume":"49","issue":"3","first_page":"291","last_page":"304"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11901","display_name":"Bayesian Methods and Mixture Models","score":0.9922000169754028,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10057","display_name":"Face and Expression Recognition","score":0.9901999831199646,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/overfitting","display_name":"Overfitting","score":0.8020586371421814},{"id":"https://openalex.org/keywords/logistic-model-tree","display_name":"Logistic model tree","score":0.6934609413146973},{"id":"https://openalex.org/keywords/logistic-regression","display_name":"Logistic regression","score":0.6655988693237305},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6304411888122559},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5595265030860901},{"id":"https://openalex.org/keywords/feature-selection","display_name":"Feature selection","score":0.5509822964668274},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.5227689743041992},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.48806560039520264},{"id":"https://openalex.org/keywords/naive-bayes-classifier","display_name":"Naive Bayes classifier","score":0.47001174092292786},{"id":"https://openalex.org/keywords/multinomial-logistic-regression","display_name":"Multinomial logistic regression","score":0.42884087562561035},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.4132651090621948},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.3932819366455078},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.36740702390670776},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.28257423639297485},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.07447731494903564}],"concepts":[{"id":"https://openalex.org/C22019652","wikidata":"https://www.wikidata.org/wiki/Q331309","display_name":"Overfitting","level":3,"score":0.8020586371421814},{"id":"https://openalex.org/C61722155","wikidata":"https://www.wikidata.org/wiki/Q6667643","display_name":"Logistic model tree","level":3,"score":0.6934609413146973},{"id":"https://openalex.org/C151956035","wikidata":"https://www.wikidata.org/wiki/Q1132755","display_name":"Logistic regression","level":2,"score":0.6655988693237305},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6304411888122559},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5595265030860901},{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.5509822964668274},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.5227689743041992},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.48806560039520264},{"id":"https://openalex.org/C52001869","wikidata":"https://www.wikidata.org/wiki/Q812530","display_name":"Naive Bayes classifier","level":3,"score":0.47001174092292786},{"id":"https://openalex.org/C117568660","wikidata":"https://www.wikidata.org/wiki/Q1650843","display_name":"Multinomial logistic regression","level":2,"score":0.42884087562561035},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.4132651090621948},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.3932819366455078},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.36740702390670776},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.28257423639297485},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.07447731494903564}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1198/004017007000000245","is_oa":false,"landing_page_url":"https://doi.org/10.1198/004017007000000245","pdf_url":null,"source":{"id":"https://openalex.org/S985303","display_name":"Technometrics","issn_l":"0040-1706","issn":["0040-1706","1537-2723"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320547","host_organization_name":"Taylor & Francis","host_organization_lineage":["https://openalex.org/P4310320547"],"host_organization_lineage_names":["Taylor & Francis"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Technometrics","raw_type":"journal-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.360.5168","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.360.5168","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.stat.columbia.edu/~madigan/PAPERS/techno.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320337372","display_name":"U.S. National Library of Medicine","ror":"https://ror.org/0060t0j89"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":67,"referenced_works":["https://openalex.org/W144798229","https://openalex.org/W155555924","https://openalex.org/W182831726","https://openalex.org/W220758854","https://openalex.org/W1524688041","https://openalex.org/W1540198634","https://openalex.org/W1540550673","https://openalex.org/W1554663460","https://openalex.org/W1554944419","https://openalex.org/W1564518192","https://openalex.org/W1566768190","https://openalex.org/W1572615921","https://openalex.org/W1574901103","https://openalex.org/W1579838312","https://openalex.org/W1648445109","https://openalex.org/W1924689489","https://openalex.org/W1971289666","https://openalex.org/W1978394996","https://openalex.org/W1980922217","https://openalex.org/W1993644118","https://openalex.org/W1999974018","https://openalex.org/W2005404141","https://openalex.org/W2009190245","https://openalex.org/W2010526612","https://openalex.org/W2047028564","https://openalex.org/W2053463056","https://openalex.org/W2060216474","https://openalex.org/W2063978378","https://openalex.org/W2063993968","https://openalex.org/W2071664212","https://openalex.org/W2098162425","https://openalex.org/W2100322632","https://openalex.org/W2101095383","https://openalex.org/W2102650424","https://openalex.org/W2102667697","https://openalex.org/W2103333826","https://openalex.org/W2106393550","https://openalex.org/W2118020653","https://openalex.org/W2122825543","https://openalex.org/W2125781844","https://openalex.org/W2129049059","https://openalex.org/W2135046866","https://openalex.org/W2136052850","https://openalex.org/W2146571341","https://openalex.org/W2147598330","https://openalex.org/W2148576472","https://openalex.org/W2149684865","https://openalex.org/W2150102617","https://openalex.org/W2150579376","https://openalex.org/W2150940164","https://openalex.org/W2152734820","https://openalex.org/W2153890685","https://openalex.org/W2153962014","https://openalex.org/W2156512439","https://openalex.org/W2181650752","https://openalex.org/W2266946488","https://openalex.org/W2435251607","https://openalex.org/W2437356612","https://openalex.org/W2715880412","https://openalex.org/W2797692640","https://openalex.org/W3207007339","https://openalex.org/W4239353198","https://openalex.org/W4241931738","https://openalex.org/W4247440588","https://openalex.org/W4255455317","https://openalex.org/W4285719527","https://openalex.org/W4293902500"],"related_works":["https://openalex.org/W4295122168","https://openalex.org/W3155717344","https://openalex.org/W1770458422","https://openalex.org/W4378417285","https://openalex.org/W4246416652","https://openalex.org/W2346848267","https://openalex.org/W3164319184","https://openalex.org/W2528588360","https://openalex.org/W2494119046","https://openalex.org/W4236124836"],"abstract_inverted_index":{"Logistic":[0],"regression":[1,30,82],"analysis":[2],"of":[3,55],"high-dimensional":[4],"data,":[5],"such":[6],"as":[7,69,71],"natural":[8],"language":[9],"text,":[10],"poses":[11],"computational":[12],"and":[13,40,59,98,100],"statistical":[14],"challenges.":[15],"Maximum":[16],"likelihood":[17],"estimation":[18],"often":[19],"fails":[20],"in":[21],"these":[22],"applications.":[23],"We":[24,48,87],"present":[25],"a":[26,34,53],"simple":[27],"Bayesian":[28],"logistic":[29,81],"approach":[31,51],"that":[32,61],"uses":[33],"Laplace":[35],"prior":[36],"to":[37,52],"avoid":[38],"overfitting":[39],"produces":[41,63],"sparse":[42],"predictive":[43,65],"models":[44,66],"for":[45],"text":[46],"data.":[47],"apply":[49],"this":[50],"range":[54],"document":[56],"classification":[57],"problems":[58],"show":[60],"it":[62],"compact":[64],"at":[67],"least":[68],"effective":[70],"those":[72],"produced":[73],"by":[74],"support":[75],"vector":[76],"machine":[77],"classifiers":[78],"or":[79],"ridge":[80],"combined":[83],"with":[84],"feature":[85],"selection.":[86],"describe":[88],"our":[89,93],"model":[90],"fitting":[91],"algorithm,":[92],"open":[94],"source":[95],"implementations":[96],"(BBR":[97],"BMR),":[99],"experimental":[101],"results.":[102]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":12},{"year":2024,"cited_by_count":36},{"year":2023,"cited_by_count":33},{"year":2022,"cited_by_count":55},{"year":2021,"cited_by_count":51},{"year":2020,"cited_by_count":43},{"year":2019,"cited_by_count":52},{"year":2018,"cited_by_count":47},{"year":2017,"cited_by_count":35},{"year":2016,"cited_by_count":37},{"year":2015,"cited_by_count":41},{"year":2014,"cited_by_count":48},{"year":2013,"cited_by_count":51},{"year":2012,"cited_by_count":54}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
