{"id":"https://openalex.org/W4312226134","doi":"https://doi.org/10.48550/arxiv.2212.12771","title":"Unsupervised Instance and Subnetwork Selection for Network Data","display_name":"Unsupervised Instance and Subnetwork Selection for Network Data","publication_year":2022,"publication_date":"2022-12-24","ids":{"openalex":"https://openalex.org/W4312226134","doi":"https://doi.org/10.48550/arxiv.2212.12771"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2212.12771","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2212.12771","pdf_url":"https://arxiv.org/pdf/2212.12771","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2212.12771","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100351875","display_name":"Lin Zhang","orcid":"https://orcid.org/0000-0002-7404-5231"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zhang, Lin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064776075","display_name":"Nicholas Moskwa","orcid":"https://orcid.org/0000-0002-9819-9227"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Moskwa, Nicholas","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087618896","display_name":"Melinda Larsen","orcid":"https://orcid.org/0000-0002-5026-2012"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Larsen, Melinda","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5001272357","display_name":"Petko Bogdanov","orcid":"https://orcid.org/0000-0001-6310-3224"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bogdanov, Petko","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100351875"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10836","display_name":"Metabolomics and Mass Spectrometry Studies","score":0.9922999739646912,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10836","display_name":"Metabolomics and Mass Spectrometry Studies","score":0.9922999739646912,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10885","display_name":"Gene expression and cancer classification","score":0.988099992275238,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10887","display_name":"Bioinformatics and Genomic Networks","score":0.9861000180244446,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/subnetwork","display_name":"Subnetwork","score":0.9245901107788086},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7868170738220215},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.6865053176879883},{"id":"https://openalex.org/keywords/outlier","display_name":"Outlier","score":0.5221638679504395},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5214033126831055},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5076106786727905},{"id":"https://openalex.org/keywords/snapshot","display_name":"Snapshot (computer storage)","score":0.49507513642311096},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.46028557419776917},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.43449175357818604},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.16412478685379028}],"concepts":[{"id":"https://openalex.org/C2780186347","wikidata":"https://www.wikidata.org/wiki/Q11414","display_name":"Subnetwork","level":2,"score":0.9245901107788086},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7868170738220215},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.6865053176879883},{"id":"https://openalex.org/C79337645","wikidata":"https://www.wikidata.org/wiki/Q779824","display_name":"Outlier","level":2,"score":0.5221638679504395},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5214033126831055},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5076106786727905},{"id":"https://openalex.org/C55282118","wikidata":"https://www.wikidata.org/wiki/Q252683","display_name":"Snapshot (computer storage)","level":2,"score":0.49507513642311096},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.46028557419776917},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.43449175357818604},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.16412478685379028},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2212.12771","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2212.12771","pdf_url":"https://arxiv.org/pdf/2212.12771","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2212.12771","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2212.12771","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2212.12771","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2212.12771","pdf_url":"https://arxiv.org/pdf/2212.12771","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[{"display_name":"Reduced inequalities","score":0.7300000190734863,"id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320332161","display_name":"National Institutes of Health","ror":"https://ror.org/01cwqze88"},{"id":"https://openalex.org/F4320337391","display_name":"Division of Civil, Mechanical and Manufacturing Innovation","ror":"https://ror.org/028yd4c30"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4312226134.pdf","grobid_xml":"https://content.openalex.org/works/W4312226134.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2060724872","https://openalex.org/W2082094785","https://openalex.org/W2202198356","https://openalex.org/W3087203342","https://openalex.org/W2377184161","https://openalex.org/W228984114","https://openalex.org/W4226360758","https://openalex.org/W2090026684","https://openalex.org/W2907567977","https://openalex.org/W4320039951"],"abstract_inverted_index":{"Unlike":[0],"tabular":[1],"data,":[2,100],"features":[3],"in":[4,30,98,153],"network":[5,25,80,99,111,155],"data":[6,35,81,142],"are":[7],"interconnected":[8],"within":[9,88],"a":[10,22,31,104],"domain-specific":[11],"graph.":[12],"Examples":[13],"of":[14,41],"this":[15],"setting":[16],"include":[17],"gene":[18],"expression":[19],"overlaid":[20],"on":[21,124,139],"protein":[23],"interaction":[24],"(PPI)":[26],"and":[27,43,49,57,76,95,129,163],"user":[28],"opinions":[29],"social":[32],"network.":[33],"Network":[34],"is":[36,54],"typically":[37],"high-dimensional":[38],"(large":[39],"number":[40],"nodes)":[42],"often":[44,55],"contains":[45],"outlier":[46],"snapshot":[47],"instances":[48,61,78,116],"noise.":[50],"In":[51],"addition,":[52],"it":[53,160],"non-trivial":[56],"time-consuming":[58],"to":[59,135],"annotate":[60],"with":[62],"global":[63],"labels":[64],"(e.g.,":[65],"disease":[66],"or":[67],"normal).":[68],"How":[69],"can":[70],"we":[71,144],"jointly":[72],"select":[73],"discriminative":[74,126],"subnetworks":[75],"representative":[77,115,130],"for":[79,92,146,150],"without":[82],"supervision?":[83],"We":[84],"address":[85],"these":[86],"challenges":[87],"an":[89,109],"unsupervised":[90],"framework":[91],"joint":[93],"subnetwork":[94,127],"instance":[96,131],"selection":[97,128],"called":[101],"UISS,":[102],"via":[103],"convex":[105],"self-representation":[106],"objective.":[107],"Given":[108],"unlabeled":[110],"dataset,":[112],"UISS":[113],"identifies":[114],"while":[117],"ignoring":[118],"outliers.":[119],"It":[120],"outperforms":[121],"state-of-the-art":[122],"baselines":[123],"both":[125],"selection,":[132],"achieving":[133],"up":[134],"10%":[136],"accuracy":[137],"improvement":[138],"all":[140],"real-world":[141],"sets":[143],"use":[145],"evaluation.":[147],"When":[148],"employed":[149],"exploratory":[151],"analysis":[152],"RNA-seq":[154],"samples":[156],"from":[157],"multiple":[158],"studies":[159],"produces":[161],"interpretable":[162],"informative":[164],"summaries.":[165]},"counts_by_year":[],"updated_date":"2026-02-09T09:26:11.010843","created_date":"2025-10-10T00:00:00"}
