{"id":"https://openalex.org/W7125207899","doi":"https://doi.org/10.48550/arxiv.2601.12807","title":"Semi-supervised Instruction Tuning for Large Language Models on Text-Attributed Graphs","display_name":"Semi-supervised Instruction Tuning for Large Language Models on Text-Attributed Graphs","publication_year":2026,"publication_date":"2026-01-19","ids":{"openalex":"https://openalex.org/W7125207899","doi":"https://doi.org/10.48550/arxiv.2601.12807"},"language":"en","primary_location":{"id":"pmh:oai:research-information.bris.ac.uk:openaire_cris_publications/22a763a1-671a-41c5-b3b6-e4f6529103a0","is_oa":false,"landing_page_url":"https://research-information.bris.ac.uk/en/publications/22a763a1-671a-41c5-b3b6-e4f6529103a0","pdf_url":null,"source":{"id":"https://openalex.org/S7407055359","display_name":"Explore Bristol Research","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Song, Z & King, I 2026, Semi-supervised Instruction Tuning for Large Language Models on Text-Attributed Graphs. in Proceedings of the ACM Web Conference 2026. Association for Computing Machinery.","raw_type":"contributionToPeriodical"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2601.12807","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5123179305","display_name":"Zixing Song","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Song, Zixing","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5123516107","display_name":"Irwin King","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"King, Irwin","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5123179305"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.9746999740600586,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.9746999740600586,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.008799999952316284,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12292","display_name":"Graph Theory and Algorithms","score":0.002300000051036477,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.6951000094413757},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.6951000094413757},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5856999754905701},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5856999754905701},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.49549999833106995},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.49549999833106995},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.46309998631477356},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.46309998631477356},{"id":"https://openalex.org/keywords/transformative-learning","display_name":"Transformative learning","score":0.35359999537467957}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8026000261306763},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8026000261306763},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.6951000094413757},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.6951000094413757},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5856999754905701},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5856999754905701},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.49549999833106995},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.49549999833106995},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.4690999984741211},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.4690999984741211},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.46309998631477356},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.46309998631477356},{"id":"https://openalex.org/C70587473","wikidata":"https://www.wikidata.org/wiki/Q7834111","display_name":"Transformative learning","level":2,"score":0.35359999537467957},{"id":"https://openalex.org/C70587473","wikidata":"https://www.wikidata.org/wiki/Q7834111","display_name":"Transformative learning","level":2,"score":0.35359999537467957},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3499999940395355},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3499999940395355},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3472000062465668},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3472000062465668},{"id":"https://openalex.org/C76946457","wikidata":"https://www.wikidata.org/wiki/Q504843","display_name":"Graph coloring","level":3,"score":0.3287000060081482},{"id":"https://openalex.org/C76946457","wikidata":"https://www.wikidata.org/wiki/Q504843","display_name":"Graph coloring","level":3,"score":0.3287000060081482},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.2992999851703644},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.2992999851703644},{"id":"https://openalex.org/C159694833","wikidata":"https://www.wikidata.org/wiki/Q2321565","display_name":"Iterative method","level":2,"score":0.2973000109195709},{"id":"https://openalex.org/C159694833","wikidata":"https://www.wikidata.org/wiki/Q2321565","display_name":"Iterative method","level":2,"score":0.2973000109195709},{"id":"https://openalex.org/C62611344","wikidata":"https://www.wikidata.org/wiki/Q1062658","display_name":"Node (physics)","level":2,"score":0.296099990606308},{"id":"https://openalex.org/C62611344","wikidata":"https://www.wikidata.org/wiki/Q1062658","display_name":"Node (physics)","level":2,"score":0.296099990606308},{"id":"https://openalex.org/C2779982483","wikidata":"https://www.wikidata.org/wiki/Q6094420","display_name":"Iterative refinement","level":2,"score":0.27390000224113464},{"id":"https://openalex.org/C2779982483","wikidata":"https://www.wikidata.org/wiki/Q6094420","display_name":"Iterative refinement","level":2,"score":0.27390000224113464},{"id":"https://openalex.org/C146380142","wikidata":"https://www.wikidata.org/wiki/Q1137726","display_name":"Directed graph","level":2,"score":0.2572999894618988},{"id":"https://openalex.org/C146380142","wikidata":"https://www.wikidata.org/wiki/Q1137726","display_name":"Directed graph","level":2,"score":0.2572999894618988},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.2547000050544739},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.2547000050544739},{"id":"https://openalex.org/C2778915421","wikidata":"https://www.wikidata.org/wiki/Q3643177","display_name":"Performance improvement","level":2,"score":0.2524000108242035},{"id":"https://openalex.org/C2778915421","wikidata":"https://www.wikidata.org/wiki/Q3643177","display_name":"Performance improvement","level":2,"score":0.2524000108242035}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:research-information.bris.ac.uk:openaire_cris_publications/22a763a1-671a-41c5-b3b6-e4f6529103a0","is_oa":false,"landing_page_url":"https://research-information.bris.ac.uk/en/publications/22a763a1-671a-41c5-b3b6-e4f6529103a0","pdf_url":null,"source":{"id":"https://openalex.org/S7407055359","display_name":"Explore Bristol Research","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Song, Z & King, I 2026, Semi-supervised Instruction Tuning for Large Language Models on Text-Attributed Graphs. in Proceedings of the ACM Web Conference 2026. Association for Computing Machinery.","raw_type":"contributionToPeriodical"},{"id":"doi:10.48550/arxiv.2601.12807","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.12807","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2601.12807","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.12807","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.7092506289482117,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0],"emergent":[1],"reasoning":[2],"capabilities":[3],"of":[4,40,82,175],"Large":[5],"Language":[6],"Models":[7],"(LLMs)":[8],"offer":[9],"a":[10,37,105],"transformative":[11],"paradigm":[12],"for":[13,24,62,96,111,163,171],"analyzing":[14],"text-attributed":[15,208],"graphs.":[16],"While":[17],"instruction":[18,74,128,150,199],"tuning":[19,75,129,200],"is":[20,51,67,118,147],"the":[21,55,79,135,145,155,169,172,183,186,216],"prevailing":[22],"method":[23,130],"adapting":[25],"pre-trained":[26],"LLMs":[27,133],"to":[28,77,90,166],"graph":[29,73,127,198,209],"learning":[30],"tasks":[31],"like":[32],"node":[33,188],"classification,":[34],"it":[35,159],"requires":[36],"substantial":[38],"volume":[39],"annotated":[41],"(INSTRUCTION,":[42],"OUTPUT)":[43],"pairs":[44,151],"deriving":[45],"from":[46,154],"labeled":[47,156],"nodes.":[48,157],"This":[49],"requirement":[50],"particularly":[52],"prohibitive":[53],"in":[54],"social":[56],"domain,":[57],"where":[58],"obtaining":[59],"expert":[60],"labels":[61],"sensitive":[63],"or":[64],"evolving":[65],"content":[66],"costly":[68],"and":[69,120],"slow.":[70],"Furthermore,":[71],"standard":[72],"fails":[76],"exploit":[78],"vast":[80],"amount":[81],"unlabeled":[83,164],"nodes,":[84],"which":[85],"contain":[86],"latent":[87],"correlations":[88],"due":[89],"edge":[91],"connections":[92],"that":[93,131,193],"are":[94],"beneficial":[95],"downstream":[97],"predictions.":[98],"To":[99],"bridge":[100],"this":[101,178],"gap,":[102],"we":[103],"propose":[104],"novel":[106],"Semi-supervised":[107],"Instruction":[108],"Tuning":[109],"pipeline":[110],"Graph":[112],"Learning,":[113],"named":[114],"SIT-Graph.":[115],"Notably,":[116],"SIT-Graph":[117,137,202],"model-agnostic":[119],"can":[121],"be":[122],"seamlessly":[123],"integrated":[124],"into":[125,196],"any":[126],"utilizes":[132],"as":[134],"predictor.":[136],"operates":[138],"via":[139],"an":[140],"iterative":[141,179],"self-training":[142],"process.":[143],"Initially,":[144],"model":[146],"fine-tuned":[148],"using":[149],"constructed":[152],"solely":[153],"Then":[158],"generates":[160],"confidence-filtered":[161],"pseudo-responses":[162],"nodes":[165],"strategically":[167],"augment":[168],"dataset":[170],"next":[173],"round":[174],"fine-tuning.":[176],"Finally,":[177],"refinement":[180],"progressively":[181],"aligns":[182],"LLM":[184],"with":[185],"underlying":[187],"correlations.":[189],"Extensive":[190],"experiments":[191],"demonstrate":[192],"when":[194],"incorporated":[195],"state-of-the-art":[197],"methods,":[201],"significantly":[203],"enhances":[204],"their":[205],"performance":[206],"on":[207],"benchmarks,":[210],"achieving":[211],"over":[212],"20%":[213],"improvement":[214],"under":[215],"low":[217],"label":[218],"ratio":[219],"settings.":[220]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-01-22T00:00:00"}
