{"id":"https://openalex.org/W4385568197","doi":"https://doi.org/10.1145/3580305.3599366","title":"GetPt: Graph-enhanced General Table Pre-training with Alternate Attention Network","display_name":"GetPt: Graph-enhanced General Table Pre-training with Alternate Attention Network","publication_year":2023,"publication_date":"2023-08-04","ids":{"openalex":"https://openalex.org/W4385568197","doi":"https://doi.org/10.1145/3580305.3599366"},"language":"en","primary_location":{"id":"doi:10.1145/3580305.3599366","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3580305.3599366","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102878647","display_name":"Ran Jia","orcid":"https://orcid.org/0009-0004-3540-5910"},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Ran Jia","raw_affiliation_strings":["Microsoft, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0004-3540-5910","affiliations":[{"raw_affiliation_string":"Microsoft, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007667549","display_name":"Haoming Guo","orcid":"https://orcid.org/0009-0000-3168-4167"},"institutions":[{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Haoming Guo","raw_affiliation_strings":["University of California, Berkeley, Berkeley, CA, USA"],"raw_orcid":"https://orcid.org/0009-0000-3168-4167","affiliations":[{"raw_affiliation_string":"University of California, Berkeley, Berkeley, CA, USA","institution_ids":["https://openalex.org/I95457486"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101399603","display_name":"Xiaoyuan Jin","orcid":"https://orcid.org/0009-0006-9191-9275"},"institutions":[{"id":"https://openalex.org/I35440088","display_name":"ETH Zurich","ror":"https://ror.org/05a28rw58","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I35440088"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Xiaoyuan Jin","raw_affiliation_strings":["ETH Z\u00fcrich, Z\u00fcrich, Switzerland"],"raw_orcid":"https://orcid.org/0009-0006-9191-9275","affiliations":[{"raw_affiliation_string":"ETH Z\u00fcrich, Z\u00fcrich, Switzerland","institution_ids":["https://openalex.org/I35440088"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101564263","display_name":"Chao Yan","orcid":"https://orcid.org/0000-0001-5929-8233"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chao Yan","raw_affiliation_strings":["Peking University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-5929-8233","affiliations":[{"raw_affiliation_string":"Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008387608","display_name":"Lun Du","orcid":"https://orcid.org/0000-0002-7625-0650"},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lun Du","raw_affiliation_strings":["Microsoft, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-7625-0650","affiliations":[{"raw_affiliation_string":"Microsoft, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052953923","display_name":"Xiaojun Ma","orcid":"https://orcid.org/0000-0001-6757-3055"},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaojun Ma","raw_affiliation_strings":["Microsoft, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-6757-3055","affiliations":[{"raw_affiliation_string":"Microsoft, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103218676","display_name":"Tamara Stankovic","orcid":"https://orcid.org/0009-0007-0644-7398"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tamara Stankovic","raw_affiliation_strings":["Microsoft, Belgrade, Serbia"],"raw_orcid":"https://orcid.org/0009-0007-0644-7398","affiliations":[{"raw_affiliation_string":"Microsoft, Belgrade, Serbia","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5092595903","display_name":"Marko Lozajic","orcid":"https://orcid.org/0009-0006-2234-1692"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Marko Lozajic","raw_affiliation_strings":["Microsoft, Belgrade, Serbia"],"raw_orcid":"https://orcid.org/0009-0006-2234-1692","affiliations":[{"raw_affiliation_string":"Microsoft, Belgrade, Serbia","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5092595904","display_name":"Goran Zoranovic","orcid":"https://orcid.org/0009-0005-0560-8327"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Goran Zoranovic","raw_affiliation_strings":["Microsoft, Belgrade, Serbia"],"raw_orcid":"https://orcid.org/0009-0005-0560-8327","affiliations":[{"raw_affiliation_string":"Microsoft, Belgrade, Serbia","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063172118","display_name":"Igor Ilic","orcid":"https://orcid.org/0009-0002-5119-7993"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Igor Ilic","raw_affiliation_strings":["Microsoft, Belgrade, Serbia"],"raw_orcid":"https://orcid.org/0009-0002-5119-7993","affiliations":[{"raw_affiliation_string":"Microsoft, Belgrade, Serbia","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006300825","display_name":"Shi Han","orcid":"https://orcid.org/0000-0002-0360-6089"},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shi Han","raw_affiliation_strings":["Microsoft, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-0360-6089","affiliations":[{"raw_affiliation_string":"Microsoft, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100331488","display_name":"Dongmei Zhang","orcid":"https://orcid.org/0000-0002-9230-2799"},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dongmei Zhang","raw_affiliation_strings":["Microsoft, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-9230-2799","affiliations":[{"raw_affiliation_string":"Microsoft, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":12,"corresponding_author_ids":["https://openalex.org/A5102878647"],"corresponding_institution_ids":["https://openalex.org/I4210113369"],"apc_list":null,"apc_paid":null,"fwci":0.7397,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.74319386,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"941","last_page":"950"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9937999844551086,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9923999905586243,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8461956977844238},{"id":"https://openalex.org/keywords/table","display_name":"Table (database)","score":0.7312639951705933},{"id":"https://openalex.org/keywords/scope","display_name":"Scope (computer science)","score":0.4583124816417694},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.4465470314025879},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.43016886711120605},{"id":"https://openalex.org/keywords/flexibility","display_name":"Flexibility (engineering)","score":0.4270821213722229},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.38433679938316345},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.37282314896583557},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3432488739490509},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.22140595316886902}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8461956977844238},{"id":"https://openalex.org/C45235069","wikidata":"https://www.wikidata.org/wiki/Q278425","display_name":"Table (database)","level":2,"score":0.7312639951705933},{"id":"https://openalex.org/C2778012447","wikidata":"https://www.wikidata.org/wiki/Q1034415","display_name":"Scope (computer science)","level":2,"score":0.4583124816417694},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.4465470314025879},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.43016886711120605},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.4270821213722229},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.38433679938316345},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.37282314896583557},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3432488739490509},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.22140595316886902},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3580305.3599366","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3580305.3599366","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":23,"referenced_works":["https://openalex.org/W2002252784","https://openalex.org/W2021167849","https://openalex.org/W2081580037","https://openalex.org/W2115253074","https://openalex.org/W2138556038","https://openalex.org/W2290320465","https://openalex.org/W2398606196","https://openalex.org/W2604225376","https://openalex.org/W3003206728","https://openalex.org/W3035140194","https://openalex.org/W3093787307","https://openalex.org/W3129639992","https://openalex.org/W3153032435","https://openalex.org/W3155299751","https://openalex.org/W3157891451","https://openalex.org/W3162752841","https://openalex.org/W3165753548","https://openalex.org/W3168052339","https://openalex.org/W3173486678","https://openalex.org/W3176384932","https://openalex.org/W3211394146","https://openalex.org/W4226189435","https://openalex.org/W4304098321"],"related_works":["https://openalex.org/W4241523039","https://openalex.org/W2360028903","https://openalex.org/W4280543773","https://openalex.org/W178231042","https://openalex.org/W2366083136","https://openalex.org/W2387622493","https://openalex.org/W1932132538","https://openalex.org/W2357832196","https://openalex.org/W1566252468","https://openalex.org/W4200375594"],"abstract_inverted_index":{"Tables":[0],"are":[1,72],"widely":[2],"used":[3],"for":[4,39,49,95],"data":[5,28],"storage":[6],"and":[7,23,58,106,144,172,190,201,212],"presentation":[8],"due":[9],"to":[10,101,113,122,139,157],"their":[11,77],"high":[12],"flexibility":[13],"in":[14],"layout.":[15],"The":[16],"importance":[17],"of":[18,26,34,44,52,120,126,146,166,181],"tables":[19,57,59,64,75,102],"as":[20,55],"information":[21,162],"carriers":[22],"the":[24,45,124,127,131,142,147,152,160,173,192],"complexity":[25],"tabular":[27,40],"understanding":[29],"attract":[30],"a":[31,91,111,114,133,167,178,195],"great":[32],"deal":[33],"research":[35],"on":[36,130,194,205,224],"large-scale":[37],"pre-training":[38,93,188],"data.":[41],"However,":[42],"most":[43],"works":[46],"design":[47],"models":[48],"specific":[50],"types":[51,119],"tables,":[53],"such":[54,74],"relational":[56],"with":[60,65,103,117],"well-structured":[61],"headers,":[62],"neglecting":[63],"complex":[66,104],"layouts.":[67,107],"In":[68,85],"real-world":[69],"scenarios,":[70],"there":[71],"many":[73],"beyond":[76],"target":[78],"scope":[79],"that":[80,218],"cannot":[81],"be":[82],"well":[83],"supported.":[84],"this":[86],"paper,":[87],"we":[88,109,150,184],"propose":[89],"GetPt,":[90],"unified":[92],"architecture":[94],"general":[96],"table":[97,112,168,197,209,213],"representation":[98],"applicable":[99],"even":[100],"structures":[105],"First,":[108],"convert":[110],"heterogeneous":[115],"graph":[116],"multiple":[118,164],"edges":[121],"represent":[123],"layout":[125],"table.":[128,148,174],"Based":[129],"graph,":[132],"specially":[134],"designed":[135],"transformer":[136],"is":[137],"applied":[138],"jointly":[140],"model":[141,159,193,204],"semantics":[143],"structure":[145,214],"Second,":[149],"devise":[151],"Alternate":[153],"Attention":[154],"Network":[155],"(AAN)":[156],"better":[158,176],"contextual":[161],"across":[163],"granularities":[165],"including":[169],"tokens,":[170],"cells,":[171],"To":[175],"support":[177],"wide":[179],"range":[180],"downstream":[182],"tasks,":[183,208],"further":[185],"employ":[186],"three":[187],"objectives":[189],"pre-train":[191],"large":[196],"dataset.":[198],"We":[199],"fine-tune":[200],"evaluate":[202],"GetPt":[203,219],"two":[206],"representative":[207],"type":[210],"classification,":[211],"recognition.":[215],"Experiments":[216],"show":[217],"outperforms":[220],"existing":[221],"state-of-the-art":[222],"methods":[223],"these":[225],"tasks.":[226]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
