{"id":"https://openalex.org/W2896864700","doi":"https://doi.org/10.1140/epjds/s13688-019-0201-0","title":"Predicting and explaining behavioral data with structured feature space decomposition","display_name":"Predicting and explaining behavioral data with structured feature space decomposition","publication_year":2019,"publication_date":"2019-06-27","ids":{"openalex":"https://openalex.org/W2896864700","doi":"https://doi.org/10.1140/epjds/s13688-019-0201-0","mag":"2896864700"},"language":"en","primary_location":{"id":"doi:10.1140/epjds/s13688-019-0201-0","is_oa":true,"landing_page_url":"https://doi.org/10.1140/epjds/s13688-019-0201-0","pdf_url":"https://epjdatascience.springeropen.com/track/pdf/10.1140/epjds/s13688-019-0201-0.pdf","source":{"id":"https://openalex.org/S2504380752","display_name":"EPJ Data Science","issn_l":"2193-1127","issn":["2193-1127"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EPJ Data Science","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://epjdatascience.springeropen.com/track/pdf/10.1140/epjds/s13688-019-0201-0.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5067731708","display_name":"Peter G. Fennell","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Peter G. Fennell","raw_affiliation_strings":["USC Information Sciences Institute, Marina del Rey, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"USC Information Sciences Institute, Marina del Rey, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086577630","display_name":"Zhiya Zuo","orcid":"https://orcid.org/0000-0002-3771-4731"},"institutions":[{"id":"https://openalex.org/I168719708","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23","country_code":"HK","type":"education","lineage":["https://openalex.org/I168719708"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Zhiya Zuo","raw_affiliation_strings":["City University of Hong Kong, Kowloon Tong, Hong Kong","USC Information Sciences Institute, Marina del Rey, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"City University of Hong Kong, Kowloon Tong, Hong Kong","institution_ids":["https://openalex.org/I168719708"]},{"raw_affiliation_string":"USC Information Sciences Institute, Marina del Rey, USA","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5049634383","display_name":"Kristina Lerman","orcid":"https://orcid.org/0000-0002-5071-0575"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kristina Lerman","raw_affiliation_strings":["USC Information Sciences Institute, Marina del Rey, USA"],"raw_orcid":"https://orcid.org/0000-0002-5071-0575","affiliations":[{"raw_affiliation_string":"USC Information Sciences Institute, Marina del Rey, USA","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5067731708"],"corresponding_institution_ids":[],"apc_list":{"value":1190,"currency":"GBP","value_usd":1459},"apc_paid":{"value":1190,"currency":"GBP","value_usd":1459},"fwci":20.6341,"has_fulltext":true,"cited_by_count":16,"citation_normalized_percentile":{"value":0.99106895,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"8","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.9940999746322632,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.9940999746322632,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9911999702453613,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9908000230789185,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/subspace-topology","display_name":"Subspace topology","score":0.6729549765586853},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6590070724487305},{"id":"https://openalex.org/keywords/outcome","display_name":"Outcome (game theory)","score":0.5949109792709351},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5517393350601196},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.5117166042327881},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5048325657844543},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.4897739887237549},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.46540170907974243},{"id":"https://openalex.org/keywords/population","display_name":"Population","score":0.4615687429904938},{"id":"https://openalex.org/keywords/variation","display_name":"Variation (astronomy)","score":0.42821916937828064},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.20852217078208923}],"concepts":[{"id":"https://openalex.org/C32834561","wikidata":"https://www.wikidata.org/wiki/Q660730","display_name":"Subspace topology","level":2,"score":0.6729549765586853},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6590070724487305},{"id":"https://openalex.org/C148220186","wikidata":"https://www.wikidata.org/wiki/Q7111912","display_name":"Outcome (game theory)","level":2,"score":0.5949109792709351},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5517393350601196},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.5117166042327881},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5048325657844543},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.4897739887237549},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.46540170907974243},{"id":"https://openalex.org/C2908647359","wikidata":"https://www.wikidata.org/wiki/Q2625603","display_name":"Population","level":2,"score":0.4615687429904938},{"id":"https://openalex.org/C2778334786","wikidata":"https://www.wikidata.org/wiki/Q1586270","display_name":"Variation (astronomy)","level":2,"score":0.42821916937828064},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.20852217078208923},{"id":"https://openalex.org/C44870925","wikidata":"https://www.wikidata.org/wiki/Q37547","display_name":"Astrophysics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C149923435","wikidata":"https://www.wikidata.org/wiki/Q37732","display_name":"Demography","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C144237770","wikidata":"https://www.wikidata.org/wiki/Q747534","display_name":"Mathematical economics","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1140/epjds/s13688-019-0201-0","is_oa":true,"landing_page_url":"https://doi.org/10.1140/epjds/s13688-019-0201-0","pdf_url":"https://epjdatascience.springeropen.com/track/pdf/10.1140/epjds/s13688-019-0201-0.pdf","source":{"id":"https://openalex.org/S2504380752","display_name":"EPJ Data Science","issn_l":"2193-1127","issn":["2193-1127"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EPJ Data Science","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:8c976ff26eee4c718561915ccc7b7d41","is_oa":true,"landing_page_url":"https://doaj.org/article/8c976ff26eee4c718561915ccc7b7d41","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"EPJ Data Science, Vol 8, Iss 1, Pp 1-27 (2019)","raw_type":"article"},{"id":"pmh:oai:pure.atira.dk:publications/a0226542-3ea8-422e-bff5-a8ff26b3faa4","is_oa":true,"landing_page_url":"https://hdl.handle.net/2031/a0226542-3ea8-422e-bff5-a8ff26b3faa4","pdf_url":null,"source":{"id":"https://openalex.org/S7407055387","display_name":"CityU Scholars","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Fennell, P G, Zuo, Z & Lerman, K 2019, 'Predicting and explaining behavioral data with structured feature space decomposition', EPJ Data Science, vol. 8, no. 1, 23. https://doi.org/10.1140/epjds/s13688-019-0201-0","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1140/epjds/s13688-019-0201-0","is_oa":true,"landing_page_url":"https://doi.org/10.1140/epjds/s13688-019-0201-0","pdf_url":"https://epjdatascience.springeropen.com/track/pdf/10.1140/epjds/s13688-019-0201-0.pdf","source":{"id":"https://openalex.org/S2504380752","display_name":"EPJ Data Science","issn_l":"2193-1127","issn":["2193-1127"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EPJ Data Science","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.6800000071525574}],"awards":[{"id":"https://openalex.org/G2420683902","display_name":null,"funder_award_id":"W911NF-18-C-0011","funder_id":"https://openalex.org/F4320332180","funder_display_name":"Defense Advanced Research Projects Agency"},{"id":"https://openalex.org/G7183823579","display_name":null,"funder_award_id":"W911NF-17-C-0094","funder_id":"https://openalex.org/F4320332180","funder_display_name":"Defense Advanced Research Projects Agency"},{"id":"https://openalex.org/G7452299184","display_name":null,"funder_award_id":"W911NF","funder_id":"https://openalex.org/F4320338281","funder_display_name":"Army Research Office"}],"funders":[{"id":"https://openalex.org/F4320306183","display_name":"James S. McDonnell Foundation","ror":"https://ror.org/03dy4aq19"},{"id":"https://openalex.org/F4320332180","display_name":"Defense Advanced Research Projects Agency","ror":"https://ror.org/02caytj08"},{"id":"https://openalex.org/F4320332815","display_name":"Advanced Research Projects Agency","ror":"https://ror.org/02caytj08"},{"id":"https://openalex.org/F4320338281","display_name":"Army Research Office","ror":"https://ror.org/05epdh915"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2896864700.pdf","grobid_xml":"https://content.openalex.org/works/W2896864700.grobid-xml"},"referenced_works_count":57,"referenced_works":["https://openalex.org/W970275373","https://openalex.org/W1480376833","https://openalex.org/W1481908410","https://openalex.org/W1527338945","https://openalex.org/W1572247238","https://openalex.org/W1582211066","https://openalex.org/W1594031697","https://openalex.org/W1789783821","https://openalex.org/W1914571458","https://openalex.org/W1937101755","https://openalex.org/W1944586112","https://openalex.org/W1965563190","https://openalex.org/W1974423219","https://openalex.org/W1982076499","https://openalex.org/W2016468753","https://openalex.org/W2029469881","https://openalex.org/W2043890595","https://openalex.org/W2065281378","https://openalex.org/W2078939860","https://openalex.org/W2087347434","https://openalex.org/W2090712000","https://openalex.org/W2094286023","https://openalex.org/W2100534701","https://openalex.org/W2101234009","https://openalex.org/W2102201073","https://openalex.org/W2103525487","https://openalex.org/W2106525823","https://openalex.org/W2114696370","https://openalex.org/W2122825543","https://openalex.org/W2126292488","https://openalex.org/W2128804044","https://openalex.org/W2143570267","https://openalex.org/W2159397589","https://openalex.org/W2290683883","https://openalex.org/W2381775186","https://openalex.org/W2514897959","https://openalex.org/W2547045893","https://openalex.org/W2551317447","https://openalex.org/W2584419678","https://openalex.org/W2585502432","https://openalex.org/W2607893089","https://openalex.org/W2785011159","https://openalex.org/W2787894218","https://openalex.org/W2798714739","https://openalex.org/W2911964244","https://openalex.org/W2922667820","https://openalex.org/W2950353880","https://openalex.org/W2962790223","https://openalex.org/W2963061618","https://openalex.org/W3023695158","https://openalex.org/W3085162807","https://openalex.org/W3099006712","https://openalex.org/W3099109427","https://openalex.org/W3104010597","https://openalex.org/W3105728206","https://openalex.org/W3120740533","https://openalex.org/W3138819813"],"related_works":["https://openalex.org/W2386430105","https://openalex.org/W2356521405","https://openalex.org/W1980381208","https://openalex.org/W2038534795","https://openalex.org/W2384358604","https://openalex.org/W2978999882","https://openalex.org/W1567829292","https://openalex.org/W3001063351","https://openalex.org/W3196905815","https://openalex.org/W2364594919"],"abstract_inverted_index":{"Modeling":[0],"human":[1],"behavioral":[2,64],"data":[3,65,161,190],"is":[4,32,75,209],"challenging":[5],"due":[6],"to":[7,62,110,121,138,146,153,194],"its":[8],"scale,":[9],"sparseness":[10],"(few":[11,22],"observations":[12,23],"per":[13],"individual),":[14],"heterogeneity":[15],"(differently":[16],"behaving":[17],"individuals),":[18],"and":[19,96,123,133,145,174],"class":[20],"imbalance":[21],"of":[24,27,88,100,127,142,156],"the":[25,67,86,89,94,98,114,125,128,140,188],"outcome":[26,129],"interest).":[28],"An":[29],"additional":[30],"challenge":[31],"learning":[33],"an":[34],"interpretable":[35,201],"model":[36],"that":[37,83,108,178,183,203],"not":[38],"only":[39],"accurately":[40],"predicts":[41],"outcomes,":[42],"but":[43,197,221],"also":[44,222],"identifies":[45],"important":[46,81,101,210],"factors":[47],"associated":[48],"with":[49],"a":[50,59,136,226],"given":[51],"behavior.":[52],"To":[53],"address":[54],"these":[55],"challenges,":[56],"we":[57],"describe":[58],"statistical":[60],"approach":[61],"modeling":[63],"called":[66],"structured":[68],"sum-of-squares":[69],"decomposition":[70],"(S3D).":[71],"The":[72],"algorithm,":[73],"which":[74],"inspired":[76],"by":[77],"decision":[78],"trees,":[79],"selects":[80],"features":[82,102,144],"collectively":[84],"explain":[85],"variation":[87],"outcome,":[90],"quantifies":[91],"correlations":[92],"between":[93],"features,":[95],"bins":[97],"subspace":[99,118],"into":[103,206],"smaller,":[104],"more":[105],"homogeneous":[106],"blocks":[107],"correspond":[109],"similarly-behaving":[111],"subgroups":[112],"within":[113],"population.":[115],"This":[116,208],"partitioned":[117],"allows":[119],"us":[120],"predict":[122,185],"analyze":[124],"behavior":[126],"variable":[130],"both":[131],"statistically":[132],"visually,":[134],"giving":[135],"medium":[137],"examine":[139],"effect":[141],"various":[143],"create":[147],"explainable":[148],"predictions.":[149],"We":[150,176],"apply":[151],"S3D":[152,179],"learn":[154],"models":[155,182,202],"online":[157],"activity":[158],"from":[159,163],"large-scale":[160],"collected":[162],"diverse":[164],"sites,":[165],"such":[166],"as":[167],"Stack":[168],"Exchange,":[169],"Khan":[170],"Academy,":[171],"Twitter,":[172],"Duolingo,":[173],"Digg.":[175],"show":[177],"creates":[180],"parsimonious":[181],"can":[184],"outcomes":[186],"in":[187,198],"held-out":[189],"at":[191,215],"levels":[192],"comparable":[193],"state-of-the-art":[195],"approaches,":[196],"addition,":[199],"produces":[200],"provide":[204],"insights":[205],"behaviors.":[207],"for":[211,223],"informing":[212],"strategies":[213],"aimed":[214],"changing":[216],"behavior,":[217],"designing":[218],"social":[219],"systems,":[220],"explaining":[224],"predictions,":[225],"critical":[227],"step":[228],"towards":[229],"minimizing":[230],"algorithmic":[231],"bias.":[232]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":5},{"year":2019,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
