{"id":"https://openalex.org/W4406496861","doi":"https://doi.org/10.1109/bigdata62323.2024.10826033","title":"Inferring Relationships between Tabular Data and Topics using LLM for a Dataset Search Task","display_name":"Inferring Relationships between Tabular Data and Topics using LLM for a Dataset Search Task","publication_year":2024,"publication_date":"2024-12-15","ids":{"openalex":"https://openalex.org/W4406496861","doi":"https://doi.org/10.1109/bigdata62323.2024.10826033"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata62323.2024.10826033","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata62323.2024.10826033","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Big Data (BigData)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5043268072","display_name":"Yukihisa Fujita","orcid":"https://orcid.org/0000-0002-0581-5116"},"institutions":[{"id":"https://openalex.org/I4210137853","display_name":"Toyota Motor Corporation (Japan)","ror":"https://ror.org/02zqm6r10","country_code":"JP","type":"company","lineage":["https://openalex.org/I4210125472","https://openalex.org/I4210137853"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Yukihisa Fujita","raw_affiliation_strings":["Toyota Motor Corporation,Social System PF Development Division,Tokyo,Japan"],"affiliations":[{"raw_affiliation_string":"Toyota Motor Corporation,Social System PF Development Division,Tokyo,Japan","institution_ids":["https://openalex.org/I4210137853"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015928651","display_name":"Teruaki Hayashi","orcid":"https://orcid.org/0000-0002-1806-5852"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Teruaki Hayashi","raw_affiliation_strings":["The University of Tokyo,Graduate School of Engineering,Tokyo,Japan"],"affiliations":[{"raw_affiliation_string":"The University of Tokyo,Graduate School of Engineering,Tokyo,Japan","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5049693274","display_name":"Masahiro Kuwahara","orcid":"https://orcid.org/0000-0003-2896-8622"},"institutions":[{"id":"https://openalex.org/I4210137853","display_name":"Toyota Motor Corporation (Japan)","ror":"https://ror.org/02zqm6r10","country_code":"JP","type":"company","lineage":["https://openalex.org/I4210125472","https://openalex.org/I4210137853"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Masahiro Kuwahara","raw_affiliation_strings":["Toyota Motor Corporation,Social System PF Development Division,Tokyo,Japan"],"affiliations":[{"raw_affiliation_string":"Toyota Motor Corporation,Social System PF Development Division,Tokyo,Japan","institution_ids":["https://openalex.org/I4210137853"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5043268072"],"corresponding_institution_ids":["https://openalex.org/I4210137853"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.32183276,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"6564","last_page":"6573"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9907000064849854,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9907000064849854,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9811999797821045,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9769999980926514,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7559729814529419},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.7190756797790527},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.46773582696914673},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4217660129070282},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.368878036737442},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.06179174780845642}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7559729814529419},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.7190756797790527},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.46773582696914673},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4217660129070282},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.368878036737442},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.06179174780845642},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigdata62323.2024.10826033","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata62323.2024.10826033","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Big Data (BigData)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":31,"referenced_works":["https://openalex.org/W1583837637","https://openalex.org/W2301363727","https://openalex.org/W2610332888","https://openalex.org/W2750779823","https://openalex.org/W2899286282","https://openalex.org/W2914304175","https://openalex.org/W2926805670","https://openalex.org/W2969723769","https://openalex.org/W3102264439","https://openalex.org/W3103667349","https://openalex.org/W3196904276","https://openalex.org/W4205922070","https://openalex.org/W4252681483","https://openalex.org/W4254188649","https://openalex.org/W4284700914","https://openalex.org/W4384662964","https://openalex.org/W4385245566","https://openalex.org/W4396843721","https://openalex.org/W4400529822","https://openalex.org/W4404781897","https://openalex.org/W4406458261","https://openalex.org/W6778883912","https://openalex.org/W6780992466","https://openalex.org/W6791361287","https://openalex.org/W6794246295","https://openalex.org/W6809646742","https://openalex.org/W6840081018","https://openalex.org/W6849563483","https://openalex.org/W6849640182","https://openalex.org/W6860429519","https://openalex.org/W6882228985"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"In":[0,127],"the":[1,52,55,61,78,101,107,134,146,178,188,197,201],"big":[2],"data":[3,5,23,33,63,135],"era,":[4],"is":[6,29,104],"called":[7],"new":[8,49],"oil":[9],"and":[10,16,21,27,38,91,114,119,125,171,225],"essential":[11],"things":[12],"in":[13,54],"both":[14],"business":[15,39],"academic":[17],"fields.":[18],"Both":[19],"private":[20],"public":[22],"are":[24,34,66,74],"continuously":[25],"increasing":[26],"it":[28],"expected":[30],"that":[31,105,163,196],"such":[32,93],"used":[35],"for":[36,44,69,150,154,187],"innovation":[37],"improvement.":[40],"However,":[41],"finding":[42,62],"datasets":[43,115,153,184],"specific":[45,208],"purposes":[46],"becomes":[47],"a":[48,110,120,139,207],"challenge":[50],"with":[51,168],"increase":[53],"variety":[56],"of":[57,77,80,86,88,100,112,123,165,210],"data.":[58],"To":[59],"support":[60],"task,":[64],"there":[65],"some":[67],"studies":[68],"dataset":[70,155,189],"search;":[71],"however,":[72],"they":[73],"immature":[75],"because":[76],"lack":[79],"appropriate":[81],"evaluation":[82,193],"datasets,":[83,90],"which":[84,204],"consist":[85],"sets":[87],"queries,":[89],"labels,":[92],"as":[94],"other":[95],"machine":[96],"learning":[97],"areas.":[98],"One":[99],"major":[102],"obstacles":[103],"annotating":[106],"labels":[108],"to":[109,132,144,213],"pair":[111],"queries":[113],"requires":[116],"specialized":[117],"expertise":[118],"substantial":[121],"investment":[122],"time":[124],"effort.":[126],"this":[128],"study,":[129],"we":[130],"aim":[131],"automate":[133],"annotation":[136,161,167],"process":[137],"using":[138],"large":[140],"language":[141],"model":[142],"(LLM)":[143],"reduce":[145],"manual":[147],"effort":[148],"required":[149],"creating":[151],"annotated":[152,183],"search":[156,190],"tasks.":[157],"We":[158,176],"propose":[159],"an":[160],"framework":[162,180,199],"consists":[164],"LLM":[166],"table":[169],"compression":[170],"multiple":[172],"results":[173,194],"aggregation":[174],"mechanism.":[175],"evaluated":[177],"proposed":[179,198],"by":[181],"human":[182,227],"previously":[185],"published":[186],"challenge.":[191],"The":[192],"show":[195],"outperformed":[200],"baseline":[202],"method,":[203],"input":[205],"simply":[206],"number":[209],"head":[211],"rows":[212],"LLM.":[214],"Moreover,":[215],"our":[216],"qualitative":[217],"analysis":[218],"gives":[219],"insights":[220],"into":[221],"improving":[222],"LLM-based":[223],"systems":[224],"replacing":[226],"annotators.":[228]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
