{"id":"https://openalex.org/W4282571347","doi":"https://doi.org/10.1145/3514221.3520174","title":"Demonstrating ASET: Ad-hoc Structured Exploration of Text Collections","display_name":"Demonstrating ASET: Ad-hoc Structured Exploration of Text Collections","publication_year":2022,"publication_date":"2022-06-10","ids":{"openalex":"https://openalex.org/W4282571347","doi":"https://doi.org/10.1145/3514221.3520174"},"language":"en","primary_location":{"id":"doi:10.1145/3514221.3520174","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3514221.3520174","pdf_url":null,"source":{"id":"https://openalex.org/S4363608845","display_name":"Proceedings of the 2022 International Conference on Management of Data","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2022 International Conference on Management of Data","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5021190212","display_name":"Benjamin H\u00e4ttasch","orcid":"https://orcid.org/0000-0001-8949-3611"},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technical University of Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Benjamin H\u00e4ttasch","raw_affiliation_strings":["Technical University of Darmstadt, Darmstadt, Germany"],"affiliations":[{"raw_affiliation_string":"Technical University of Darmstadt, Darmstadt, Germany","institution_ids":["https://openalex.org/I31512782"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001221750","display_name":"Jan-Micha Bodensohn","orcid":"https://orcid.org/0000-0003-4884-0300"},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technical University of Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Jan-Micha Bodensohn","raw_affiliation_strings":["Technical University of Darmstadt, Darmstadt, Germany"],"affiliations":[{"raw_affiliation_string":"Technical University of Darmstadt, Darmstadt, Germany","institution_ids":["https://openalex.org/I31512782"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5073504200","display_name":"Carsten Binnig","orcid":"https://orcid.org/0000-0002-2744-7836"},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technical University of Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Carsten Binnig","raw_affiliation_strings":["Technical University of Darmstadt, Darmstadt, Germany"],"affiliations":[{"raw_affiliation_string":"Technical University of Darmstadt, Darmstadt, Germany","institution_ids":["https://openalex.org/I31512782"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5021190212"],"corresponding_institution_ids":["https://openalex.org/I31512782"],"apc_list":null,"apc_paid":null,"fwci":0.5147,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.53186931,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"2393","last_page":"2396"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8878675103187561},{"id":"https://openalex.org/keywords/table","display_name":"Table (database)","score":0.684625506401062},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.5570797324180603},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5424150228500366},{"id":"https://openalex.org/keywords/information-extraction","display_name":"Information extraction","score":0.43475422263145447},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.35001641511917114},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.216698557138443}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8878675103187561},{"id":"https://openalex.org/C45235069","wikidata":"https://www.wikidata.org/wiki/Q278425","display_name":"Table (database)","level":2,"score":0.684625506401062},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.5570797324180603},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5424150228500366},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.43475422263145447},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.35001641511917114},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.216698557138443},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3514221.3520174","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3514221.3520174","pdf_url":null,"source":{"id":"https://openalex.org/S4363608845","display_name":"Proceedings of the 2022 International Conference on Management of Data","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2022 International Conference on Management of Data","raw_type":"proceedings-article"},{"id":"pmh:oai:tubiblio.ulb.tu-darmstadt.de:138095","is_oa":false,"landing_page_url":"http://tubiblio.ulb.tu-darmstadt.de/138095/","pdf_url":null,"source":{"id":"https://openalex.org/S4377196390","display_name":"TUbilio (Technical University of Darmstadt)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I31512782","host_organization_name":"Technische Universit\u00e4t Darmstadt","host_organization_lineage":["https://openalex.org/I31512782"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Konferenzver\u00f6ffentlichung"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7099999785423279,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":8,"referenced_works":["https://openalex.org/W1529731474","https://openalex.org/W2741609678","https://openalex.org/W2765782497","https://openalex.org/W2959026463","https://openalex.org/W3035327456","https://openalex.org/W3038098779","https://openalex.org/W3103981637","https://openalex.org/W4313371817"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W4394360958","https://openalex.org/W2948670949","https://openalex.org/W4288047943","https://openalex.org/W4394193569","https://openalex.org/W1797990060","https://openalex.org/W1972035260","https://openalex.org/W4232484699","https://openalex.org/W2473636215","https://openalex.org/W4242025311"],"abstract_inverted_index":{"In":[0,80],"this":[1],"demo,":[2],"we":[3],"present":[4],"ASET,":[5],"a":[6,57,64,81,88,97,113,136],"novel":[7,89],"tool":[8],"to":[9,34,44,55,92,96,126],"explore":[10,127],"the":[11,32,39,70,94,104,109,148],"contents":[12],"of":[13,48,66,147],"unstructured":[14],"data":[15],"(text)":[16],"by":[17,103],"automatically":[18],"transforming":[19],"relevant":[20],"parts":[21],"into":[22],"tabular":[23],"form.":[24],"ASET":[25,110,142],"works":[26],"in":[27,135],"an":[28,144],"ad-hoc":[29],"manner":[30],"without":[31,120],"need":[33],"curate":[35],"extraction":[36],"pipelines":[37],"for":[38],"(unseen)":[40],"text":[41,128],"collection":[42],"or":[43,123],"annotate":[45],"large":[46],"amounts":[47],"training":[49],"data.":[50],"The":[51],"main":[52],"idea":[53],"is":[54],"use":[56],"new":[58],"two-phased":[59],"approach":[60],"that":[61,117],"first":[62],"extracts":[63],"superset":[65],"information":[67],"nuggets":[68],"from":[69],"texts":[71],"using":[72],"existing":[73],"extractors":[74],"such":[75],"as":[76,101],"named":[77],"entity":[78],"recognizers.":[79],"second":[82],"step,":[83],"it":[84],"leverages":[85],"embeddings":[86],"and":[87,138,141],"matching":[90],"strategy":[91],"match":[93],"extractions":[95],"structured":[98],"table":[99],"definition":[100],"requested":[102],"user.":[105],"This":[106,131],"demo":[107],"features":[108],"system":[111],"with":[112],"graphical":[114],"user":[115],"interface":[116],"allows":[118],"people":[119],"machine":[121],"learning":[122],"programming":[124],"expertise":[125],"collections":[129],"efficiently.":[130],"can":[132],"be":[133],"done":[134],"self-directed":[137],"flexible":[139],"manner,":[140],"provides":[143],"intuitive":[145],"impression":[146],"result":[149],"quality.":[150]},"counts_by_year":[{"year":2024,"cited_by_count":2}],"updated_date":"2026-02-26T08:16:20.718346","created_date":"2025-10-10T00:00:00"}
