{"id":"https://openalex.org/W6943890129","doi":"https://doi.org/10.17615/8yhx-gs35","title":"Data Integration Via Analysis of Subspaces","display_name":"Data Integration Via Analysis of Subspaces","publication_year":2021,"publication_date":"2021-08-18","ids":{"openalex":"https://openalex.org/W6943890129","doi":"https://doi.org/10.17615/8yhx-gs35"},"language":"en","primary_location":{"id":"doi:10.17615/8yhx-gs35","is_oa":true,"landing_page_url":"https://doi.org/10.17615/8yhx-gs35","pdf_url":null,"source":{"id":"https://openalex.org/S7407051488","display_name":"UNC Libraries","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"thesis"},"type":"article","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.17615/8yhx-gs35","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Prothero, Jack Benjamin","orcid":null},"institutions":[{"id":"https://openalex.org/I114027177","display_name":"University of North Carolina at Chapel Hill","ror":"https://ror.org/0130frc33","country_code":"US","type":"education","lineage":["https://openalex.org/I114027177"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Prothero, Jack Benjamin","raw_affiliation_strings":["University of North Carolina at Chapel Hill"],"affiliations":[{"raw_affiliation_string":"University of North Carolina at Chapel Hill","institution_ids":["https://openalex.org/I114027177"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I114027177"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.3929841,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T12417","display_name":"Morphological variations and asymmetry","score":0.1728000044822693,"subfield":{"id":"https://openalex.org/subfields/2608","display_name":"Geometry and Topology"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12417","display_name":"Morphological variations and asymmetry","score":0.1728000044822693,"subfield":{"id":"https://openalex.org/subfields/2608","display_name":"Geometry and Topology"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10887","display_name":"Bioinformatics and Genomic Networks","score":0.12300000339746475,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10885","display_name":"Gene expression and cancer classification","score":0.07190000265836716,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/data-integration","display_name":"Data integration","score":0.6682000160217285},{"id":"https://openalex.org/keywords/linear-subspace","display_name":"Linear subspace","score":0.6046000123023987},{"id":"https://openalex.org/keywords/data-type","display_name":"Data type","score":0.43810001015663147},{"id":"https://openalex.org/keywords/terminology","display_name":"Terminology","score":0.4065999984741211},{"id":"https://openalex.org/keywords/subspace-topology","display_name":"Subspace topology","score":0.39430001378059387},{"id":"https://openalex.org/keywords/data-point","display_name":"Data point","score":0.38190001249313354},{"id":"https://openalex.org/keywords/data-analysis","display_name":"Data analysis","score":0.37770000100135803},{"id":"https://openalex.org/keywords/data-collection","display_name":"Data collection","score":0.3691999912261963}],"concepts":[{"id":"https://openalex.org/C72634772","wikidata":"https://www.wikidata.org/wiki/Q386824","display_name":"Data integration","level":2,"score":0.6682000160217285},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6394000053405762},{"id":"https://openalex.org/C12362212","wikidata":"https://www.wikidata.org/wiki/Q728435","display_name":"Linear subspace","level":2,"score":0.6046000123023987},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4778999984264374},{"id":"https://openalex.org/C138958017","wikidata":"https://www.wikidata.org/wiki/Q190087","display_name":"Data type","level":2,"score":0.43810001015663147},{"id":"https://openalex.org/C547195049","wikidata":"https://www.wikidata.org/wiki/Q1725664","display_name":"Terminology","level":2,"score":0.4065999984741211},{"id":"https://openalex.org/C32834561","wikidata":"https://www.wikidata.org/wiki/Q660730","display_name":"Subspace topology","level":2,"score":0.39430001378059387},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.38909998536109924},{"id":"https://openalex.org/C21080849","wikidata":"https://www.wikidata.org/wiki/Q13611879","display_name":"Data point","level":2,"score":0.38190001249313354},{"id":"https://openalex.org/C175801342","wikidata":"https://www.wikidata.org/wiki/Q1988917","display_name":"Data analysis","level":2,"score":0.37770000100135803},{"id":"https://openalex.org/C133462117","wikidata":"https://www.wikidata.org/wiki/Q4929239","display_name":"Data collection","level":2,"score":0.3691999912261963},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.3610999882221222},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.3395000100135803},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.33309999108314514},{"id":"https://openalex.org/C138827492","wikidata":"https://www.wikidata.org/wiki/Q6661985","display_name":"Data processing","level":2,"score":0.33230000734329224},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.3292999863624573},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3278000056743622},{"id":"https://openalex.org/C91682802","wikidata":"https://www.wikidata.org/wiki/Q620538","display_name":"Multidimensional scaling","level":2,"score":0.30410000681877136},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.299699991941452},{"id":"https://openalex.org/C16910744","wikidata":"https://www.wikidata.org/wiki/Q7705759","display_name":"Test data","level":2,"score":0.2888000011444092},{"id":"https://openalex.org/C132010649","wikidata":"https://www.wikidata.org/wiki/Q189222","display_name":"Intuition","level":2,"score":0.2775000035762787},{"id":"https://openalex.org/C9357733","wikidata":"https://www.wikidata.org/wiki/Q6878417","display_name":"Missing data","level":2,"score":0.2766000032424927},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.2766000032424927},{"id":"https://openalex.org/C120894424","wikidata":"https://www.wikidata.org/wiki/Q1322871","display_name":"Exploratory data analysis","level":2,"score":0.27309998869895935},{"id":"https://openalex.org/C150670458","wikidata":"https://www.wikidata.org/wiki/Q4272815","display_name":"Data transformation","level":3,"score":0.2662000060081482},{"id":"https://openalex.org/C137314826","wikidata":"https://www.wikidata.org/wiki/Q2330408","display_name":"Data mapping","level":2,"score":0.262800008058548}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.17615/8yhx-gs35","is_oa":true,"landing_page_url":"https://doi.org/10.17615/8yhx-gs35","pdf_url":null,"source":{"id":"https://openalex.org/S7407051488","display_name":"UNC Libraries","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"thesis"}],"best_oa_location":{"id":"doi:10.17615/8yhx-gs35","is_oa":true,"landing_page_url":"https://doi.org/10.17615/8yhx-gs35","pdf_url":null,"source":{"id":"https://openalex.org/S7407051488","display_name":"UNC Libraries","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"thesis"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Modern":[0],"data":[1,25,27,34,44,49,59,72,131,149,153,207,212,220],"collection":[2],"in":[3,57,97,105,147],"bioinformatics":[4],"and":[5,37,45,52,109,152,160,172,211,225],"other":[6],"big-data":[7],"paradigms":[8],"often":[9],"incorporates":[10],"traits":[11],"derived":[12],"from":[13],"multiple":[14],"different":[15,48],"points":[16],"of":[17,19,33,71,90,124,139,145,174,192,195,201],"view":[18],"the":[20,169],"observations.":[21],"We":[22,134,155,166,181],"call":[23],"this":[24],"multi-view":[26],"or":[28,128],"multi-block":[29,43,84,219],"data.":[30],"The":[31],"field":[32],"integration":[35,60],"develops":[36],"applies":[38],"new":[39,95,161,185],"methods":[40],"for":[41,79,115,163,197,205],"studying":[42],"identifying":[46],"how":[47],"blocks":[50],"relate":[51],"differ.":[53],"One":[54],"major":[55],"frontier":[56],"contemporary":[58],"research":[61],"is":[62,130,203],"methodology":[63],"that":[64,136],"can":[65,141],"identify":[66],"partially-shared":[67,81,117],"structure":[68,82],"between":[69],"sub-collections":[70],"blocks.":[73],"This":[74],"thesis":[75],"presents":[76],"our":[77],"method":[78],"locating":[80],"among":[83],"data:":[85],"Data":[86],"Integration":[87],"Via":[88],"Analysis":[89],"Subspaces":[91],"(DIVAS).":[92],"DIVAS":[93,210],"combines":[94],"insights":[96],"angular":[98],"subspace":[99],"perturbation":[100],"theory":[101],"with":[102,178],"recent":[103],"developments":[104],"matrix":[106,132,213],"signal":[107],"processing":[108],"convex-concave":[110],"optimization":[111],"into":[112],"one":[113],"algorithm":[114],"parsing":[116],"structure.":[118],"An":[119],"ever-present":[120],"yet":[121],"under-examined":[122],"aspect":[123],"statistical":[125],"analysis,":[126],"integrative":[127],"otherwise,":[129],"centering.":[133],"find":[135],"additional":[137],"forms":[138],"centering":[140,164,176,202,214],"produce":[142],"novel":[143],"modes":[144],"variation":[146],"functional":[148],"analysis":[150],"(FDA)":[151],"integration.":[154],"propose":[156,183],"a":[157,184,193,206],"unified":[158],"framework":[159],"terminology":[162],"operations.":[165],"clearly":[167],"demonstrate":[168],"intuition":[170],"behind":[171],"consequences":[173],"each":[175],"choice":[177,200],"informative":[179],"graphics.":[180],"also":[182],"direction":[186],"energy":[187],"hypothesis":[188],"test":[189],"as":[190],"part":[191],"series":[194],"diagnostics":[196],"determining":[198],"which":[199],"best":[204],"set.":[208],"Both":[209],"are":[215],"illustrated":[216],"throughout":[217],"using":[218],"sets":[221],"concerning":[222],"cancer":[223],"genomics":[224],"20th":[226],"century":[227],"mortality.":[228]},"counts_by_year":[],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-10T00:00:00"}
