{"id":"https://openalex.org/W7161135341","doi":"https://doi.org/10.1016/j.neucom.2026.133935","title":"Active perception: Gaze-guided thinking for chart understanding","display_name":"Active perception: Gaze-guided thinking for chart understanding","publication_year":2026,"publication_date":"2026-05-15","ids":{"openalex":"https://openalex.org/W7161135341","doi":"https://doi.org/10.1016/j.neucom.2026.133935"},"language":"en","primary_location":{"id":"doi:10.1016/j.neucom.2026.133935","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.neucom.2026.133935","pdf_url":null,"source":{"id":"https://openalex.org/S45693802","display_name":"Neurocomputing","issn_l":"0925-2312","issn":["0925-2312","1872-8286"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neurocomputing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.1016/j.neucom.2026.133935","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5136162914","display_name":"Xin Huang","orcid":"https://orcid.org/0000-0001-7180-7002"},"institutions":[{"id":"https://openalex.org/I150744194","display_name":"Waseda University","ror":"https://ror.org/00ntfnx83","country_code":"JP","type":"education","lineage":["https://openalex.org/I150744194"]},{"id":"https://openalex.org/I4210140476","display_name":"Shanghai Zhaozhan Metal Materials","ror":"https://ror.org/03wtw1749","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210140476"]}],"countries":["CN","JP"],"is_corresponding":true,"raw_author_name":"Xin Huang","raw_affiliation_strings":["Stepfun, ShangHai, China","Waseda University, Fukuoka, Japan"],"raw_orcid":"https://orcid.org/0000-0001-7180-7002","affiliations":[{"raw_affiliation_string":"Stepfun, ShangHai, China","institution_ids":["https://openalex.org/I4210140476"]},{"raw_affiliation_string":"Waseda University, Fukuoka, Japan","institution_ids":["https://openalex.org/I150744194"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102314711","display_name":"Huang Yuanyuan","orcid":null},"institutions":[{"id":"https://openalex.org/I150744194","display_name":"Waseda University","ror":"https://ror.org/00ntfnx83","country_code":"JP","type":"education","lineage":["https://openalex.org/I150744194"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Yuanyuan Huang","raw_affiliation_strings":["Waseda University, Fukuoka, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Waseda University, Fukuoka, Japan","institution_ids":["https://openalex.org/I150744194"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100431047","display_name":"Yongliang Wang","orcid":"https://orcid.org/0000-0001-7263-9493"},"institutions":[{"id":"https://openalex.org/I150744194","display_name":"Waseda University","ror":"https://ror.org/00ntfnx83","country_code":"JP","type":"education","lineage":["https://openalex.org/I150744194"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Yongliang Wang","raw_affiliation_strings":["Waseda University, Fukuoka, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Waseda University, Fukuoka, Japan","institution_ids":["https://openalex.org/I150744194"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085546117","display_name":"Ziyang Meng","orcid":null},"institutions":[{"id":"https://openalex.org/I4210140476","display_name":"Shanghai Zhaozhan Metal Materials","ror":"https://ror.org/03wtw1749","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210140476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ziyang Meng","raw_affiliation_strings":["Stepfun, ShangHai, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Stepfun, ShangHai, China","institution_ids":["https://openalex.org/I4210140476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100641008","display_name":"Hongbing Li","orcid":"https://orcid.org/0000-0003-2420-3104"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]},{"id":"https://openalex.org/I4210140476","display_name":"Shanghai Zhaozhan Metal Materials","ror":"https://ror.org/03wtw1749","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210140476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongbing Li","raw_affiliation_strings":["Beijing University of Posts and Telecommunications, BeiJing, China","Stepfun, ShangHai, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Beijing University of Posts and Telecommunications, BeiJing, China","institution_ids":["https://openalex.org/I139759216"]},{"raw_affiliation_string":"Stepfun, ShangHai, China","institution_ids":["https://openalex.org/I4210140476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136096245","display_name":"Zejia Weng","orcid":null},"institutions":[{"id":"https://openalex.org/I4210140476","display_name":"Shanghai Zhaozhan Metal Materials","ror":"https://ror.org/03wtw1749","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210140476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zejia Weng","raw_affiliation_strings":["Stepfun, ShangHai, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Stepfun, ShangHai, China","institution_ids":["https://openalex.org/I4210140476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136132894","display_name":"Jia Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210140476","display_name":"Shanghai Zhaozhan Metal Materials","ror":"https://ror.org/03wtw1749","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210140476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jia Wang","raw_affiliation_strings":["Stepfun, ShangHai, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Stepfun, ShangHai, China","institution_ids":["https://openalex.org/I4210140476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136180381","display_name":"Yeqing Shen","orcid":null},"institutions":[{"id":"https://openalex.org/I4210140476","display_name":"Shanghai Zhaozhan Metal Materials","ror":"https://ror.org/03wtw1749","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210140476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yeqing Shen","raw_affiliation_strings":["Stepfun, ShangHai, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Stepfun, ShangHai, China","institution_ids":["https://openalex.org/I4210140476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136096354","display_name":"Haolong Yan","orcid":null},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]},{"id":"https://openalex.org/I4210140476","display_name":"Shanghai Zhaozhan Metal Materials","ror":"https://ror.org/03wtw1749","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210140476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haolong Yan","raw_affiliation_strings":["Beijing University of Posts and Telecommunications, BeiJing, China","Stepfun, ShangHai, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Beijing University of Posts and Telecommunications, BeiJing, China","institution_ids":["https://openalex.org/I139759216"]},{"raw_affiliation_string":"Stepfun, ShangHai, China","institution_ids":["https://openalex.org/I4210140476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136137427","display_name":"Kaijun Tan","orcid":null},"institutions":[{"id":"https://openalex.org/I4210140476","display_name":"Shanghai Zhaozhan Metal Materials","ror":"https://ror.org/03wtw1749","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210140476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kaijun Tan","raw_affiliation_strings":["Stepfun, ShangHai, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Stepfun, ShangHai, China","institution_ids":["https://openalex.org/I4210140476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136146114","display_name":"Zheng Ge","orcid":null},"institutions":[{"id":"https://openalex.org/I4210140476","display_name":"Shanghai Zhaozhan Metal Materials","ror":"https://ror.org/03wtw1749","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210140476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zheng Ge","raw_affiliation_strings":["Stepfun, ShangHai, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Stepfun, ShangHai, China","institution_ids":["https://openalex.org/I4210140476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136102909","display_name":"Xiangyu Tony Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210140476","display_name":"Shanghai Zhaozhan Metal Materials","ror":"https://ror.org/03wtw1749","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210140476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiangyu Zhang","raw_affiliation_strings":["Stepfun, ShangHai, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Stepfun, ShangHai, China","institution_ids":["https://openalex.org/I4210140476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136145509","display_name":"Daxin Jiang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210140476","display_name":"Shanghai Zhaozhan Metal Materials","ror":"https://ror.org/03wtw1749","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210140476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Daxin Jiang","raw_affiliation_strings":["Stepfun, ShangHai, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Stepfun, ShangHai, China","institution_ids":["https://openalex.org/I4210140476"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5136097290","display_name":"Osamu Yoshie","orcid":null},"institutions":[{"id":"https://openalex.org/I150744194","display_name":"Waseda University","ror":"https://ror.org/00ntfnx83","country_code":"JP","type":"education","lineage":["https://openalex.org/I150744194"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Osamu Yoshie","raw_affiliation_strings":["Waseda University, Fukuoka, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Waseda University, Fukuoka, Japan","institution_ids":["https://openalex.org/I150744194"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":14,"corresponding_author_ids":["https://openalex.org/A5136097290","https://openalex.org/A5136162914"],"corresponding_institution_ids":["https://openalex.org/I150744194","https://openalex.org/I4210140476"],"apc_list":{"value":2470,"currency":"USD","value_usd":2470},"apc_paid":{"value":2470,"currency":"USD","value_usd":2470},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.89565519,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"695","issue":null,"first_page":"133935","last_page":"133935"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11707","display_name":"Gaze Tracking and Assistive Technology","score":0.19920000433921814,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11707","display_name":"Gaze Tracking and Assistive Technology","score":0.19920000433921814,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11516","display_name":"Visual and Cognitive Learning Processes","score":0.049300000071525574,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10982","display_name":"Motor Control and Adaptation","score":0.039000000804662704,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/chart","display_name":"Chart","score":0.6299999952316284},{"id":"https://openalex.org/keywords/control-chart","display_name":"Control chart","score":0.357699990272522},{"id":"https://openalex.org/keywords/thinking-processes","display_name":"Thinking processes","score":0.27410000562667847},{"id":"https://openalex.org/keywords/pie-chart","display_name":"Pie chart","score":0.2538999915122986}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6517999768257141},{"id":"https://openalex.org/C190812933","wikidata":"https://www.wikidata.org/wiki/Q28923","display_name":"Chart","level":2,"score":0.6299999952316284},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.41690000891685486},{"id":"https://openalex.org/C196985124","wikidata":"https://www.wikidata.org/wiki/Q1369242","display_name":"Control chart","level":3,"score":0.357699990272522},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.29490000009536743},{"id":"https://openalex.org/C187179951","wikidata":"https://www.wikidata.org/wiki/Q7784616","display_name":"Thinking processes","level":3,"score":0.27410000562667847},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.2669999897480011},{"id":"https://openalex.org/C539667460","wikidata":"https://www.wikidata.org/wiki/Q2414942","display_name":"Management science","level":1,"score":0.258899986743927},{"id":"https://openalex.org/C205208641","wikidata":"https://www.wikidata.org/wiki/Q273404","display_name":"Pie chart","level":2,"score":0.2538999915122986},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.2506999969482422},{"id":"https://openalex.org/C199639397","wikidata":"https://www.wikidata.org/wiki/Q1788588","display_name":"Engineering drawing","level":1,"score":0.2500999867916107}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1016/j.neucom.2026.133935","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.neucom.2026.133935","pdf_url":null,"source":{"id":"https://openalex.org/S45693802","display_name":"Neurocomputing","issn_l":"0925-2312","issn":["0925-2312","1872-8286"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neurocomputing","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1016/j.neucom.2026.133935","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.neucom.2026.133935","pdf_url":null,"source":{"id":"https://openalex.org/S45693802","display_name":"Neurocomputing","issn_l":"0925-2312","issn":["0925-2312","1872-8286"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neurocomputing","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Answering":[0],"questions":[1],"about":[2],"charts":[3,15],"presents":[4],"a":[5,41,58,64,91,182,211,245],"unique":[6],"challenge":[7],"for":[8,175,188,313],"Vision-Language":[9],"Models":[10],"(VLMs).":[11],"Unlike":[12],"natural":[13],"images,":[14],"are":[16],"structured":[17,176,203,296],"artifacts":[18],"governed":[19],"by":[20],"explicit":[21,291],"visual":[22,29,52,74,166,177,196,220,292,297],"grammar":[23],"that":[24,60,67,163,214,290],"demands":[25],"pixel-level":[26],"accuracy":[27,139,272],"in":[28,185],"perception.":[30],"While":[31],"recent":[32],"VLMs":[33,187],"demonstrate":[34],"impressive":[35],"reasoning":[36,46,65,111,174,191,212,255],"abilities":[37],"on":[38,103,135,148,251,273,283],"chart":[39,189,236,305],"tasks,":[40],"critical":[42,183],"gap":[43,184],"remains:":[44],"their":[45],"operates":[47,192],"abstractly,":[48],"disconnected":[49],"from":[50,140,202],"precise":[51,195,314],"grounding.":[53],"We":[54,180,206,240],"introduce":[55,241],"Active":[56,130,267],"Perception,":[57],"framework":[59],"enables":[61],"Gaze-Guided":[62,208],"Thinking,":[63],"pattern":[66,213],"explicitly":[68],"anchors":[69,215],"abstract":[70,216],"inference":[71,217],"to":[72,142,154,218,260],"concrete":[73,219],"locations":[75,221],"through":[76,222],"coordinate-based":[77],"operations":[78],"(Locate,":[79],"Trace,":[80],"Extract,":[81],"Compare).":[82],"To":[83],"instill":[84],"this":[85],"capability,":[86],"we":[87],"propose":[88,207],"Skill":[89,242],"Cultivation,":[90],"two-stage":[92,246],"training":[93,247],"strategy:":[94],"Stage":[95,113],"I":[96],"injects":[97],"coordinate-aware":[98],"primitives":[99],"via":[100,121],"Supervised":[101],"Fine-Tuning":[102],"ChartQAGaze-14K,":[104],"our":[105],"synthesized":[106],"dataset":[107],"of":[108,171],"14K":[109],"coordinate-annotated":[110,254],"chains;":[112],"II":[114],"internalizes":[115],"these":[116],"skills":[117],"into":[118],"adaptive":[119],"strategies":[120],"Reinforcement":[122],"Learning":[123],"with":[124,144,257,279],"outcome-based":[125,258],"rewards.":[126],"Building":[127],"upon":[128],"Qwen2.5-VL-7B,":[129],"Perception":[131,268],"achieves":[132,269],"state-of-the-art":[133],"performance":[134,282],"ChartQA,":[136],"improving":[137],"overall":[138,271],"78.96%":[141],"82.44%,":[143],"particularly":[145,280],"notable":[146],"gains":[147],"the":[149,169,284],"challenging":[150],"Human":[151,285],"split":[152,286],"(75.76%":[153],"81.28%).":[155],"Qualitative":[156,300],"analysis":[157,301],"reveals":[158,302],"emergent":[159,303],"systematic":[160],"chart-reading":[161],"behaviors":[162],"mirror":[164],"human":[165,235],"strategies,":[167],"demonstrating":[168,289],"effectiveness":[170],"spatially":[172],"grounded":[173],"understanding.":[178,298],"\u2022":[179,205,239,266,299],"identify":[181],"current":[186],"understanding:":[190],"abstractly":[193],"without":[194],"grounding,":[197],"limiting":[198],"accurate":[199],"data":[200],"extraction":[201,316],"visualizations.":[204],"Thinking":[209],",":[210,227,229,231,244],"Coordinate":[223],"Primitives":[224],"(":[225],"Locate":[226],"Trace":[228],"Extract":[230],"Compare":[232],"),":[233],"mimicking":[234],"scanning":[237],"behavior.":[238],"Cultivation":[243],"strategy":[248],"combining":[249],"SFT":[250],"ChartQAGaze-14K":[252],"(14K":[253],"chains)":[256],"RL":[259],"inject":[261],"and":[262,317],"internalize":[263],"spatially-grounded":[264],"reasoning.":[265,319],"82.44%":[270],"ChartQA":[274],"(a":[275],"3.48%":[276],"absolute":[277],"improvement),":[278],"strong":[281],"(81.28%,":[287],"+5.52%),":[288],"grounding":[293],"substantially":[294],"enhances":[295],"human-like":[304],"reading":[306],"behaviors,":[307],"where":[308],"models":[309],"systematically":[310],"leverage":[311],"coordinates":[312],"value":[315],"spatial":[318]},"counts_by_year":[],"updated_date":"2026-05-23T06:10:36.450269","created_date":"2026-05-15T00:00:00"}
