{"id":"https://openalex.org/W4402353739","doi":"https://doi.org/10.1109/ijcnn60899.2024.10650958","title":"HGSVerb: Improving Zero-shot Text Classification via Hierarchical Generative Semantic-Aware Verbalizer","display_name":"HGSVerb: Improving Zero-shot Text Classification via Hierarchical Generative Semantic-Aware Verbalizer","publication_year":2024,"publication_date":"2024-06-30","ids":{"openalex":"https://openalex.org/W4402353739","doi":"https://doi.org/10.1109/ijcnn60899.2024.10650958"},"language":"en","primary_location":{"id":"doi:10.1109/ijcnn60899.2024.10650958","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/ijcnn60899.2024.10650958","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103139071","display_name":"Zifeng Liu","orcid":"https://orcid.org/0000-0002-1392-8698"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zifeng Liu","raw_affiliation_strings":["Wuhan University,School of Computer Science,Wuhan,China"],"affiliations":[{"raw_affiliation_string":"Wuhan University,School of Computer Science,Wuhan,China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065515283","display_name":"Xu Huang","orcid":"https://orcid.org/0000-0003-3797-6042"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xu Huang","raw_affiliation_strings":["Wuhan University,School of Computer Science,Wuhan,China"],"affiliations":[{"raw_affiliation_string":"Wuhan University,School of Computer Science,Wuhan,China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056336684","display_name":"Weipeng Chen","orcid":"https://orcid.org/0000-0001-9293-7578"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weipeng Chen","raw_affiliation_strings":["Wuhan University,School of Computer Science,Wuhan,China"],"affiliations":[{"raw_affiliation_string":"Wuhan University,School of Computer Science,Wuhan,China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100327072","display_name":"Jin Liu","orcid":"https://orcid.org/0000-0003-0359-0248"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jin Liu","raw_affiliation_strings":["Wuhan University,School of Computer Science,Wuhan,China"],"affiliations":[{"raw_affiliation_string":"Wuhan University,School of Computer Science,Wuhan,China","institution_ids":["https://openalex.org/I37461747"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5103139071"],"corresponding_institution_ids":["https://openalex.org/I37461747"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.1298909,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"21","issue":null,"first_page":"1","last_page":"10"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9861999750137329,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7562679052352905},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.6614941954612732},{"id":"https://openalex.org/keywords/zero","display_name":"Zero (linguistics)","score":0.6088089346885681},{"id":"https://openalex.org/keywords/shot","display_name":"Shot (pellet)","score":0.5756054520606995},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5491424798965454},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.47786659002304077},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.07101574540138245},{"id":"https://openalex.org/keywords/materials-science","display_name":"Materials science","score":0.05563920736312866}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7562679052352905},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.6614941954612732},{"id":"https://openalex.org/C2780813799","wikidata":"https://www.wikidata.org/wiki/Q3274237","display_name":"Zero (linguistics)","level":2,"score":0.6088089346885681},{"id":"https://openalex.org/C2778344882","wikidata":"https://www.wikidata.org/wiki/Q278938","display_name":"Shot (pellet)","level":2,"score":0.5756054520606995},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5491424798965454},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.47786659002304077},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.07101574540138245},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.05563920736312866},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C191897082","wikidata":"https://www.wikidata.org/wiki/Q11467","display_name":"Metallurgy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcnn60899.2024.10650958","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/ijcnn60899.2024.10650958","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","score":0.4699999988079071,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W1552847225","https://openalex.org/W2061873838","https://openalex.org/W2163455955","https://openalex.org/W2170240176","https://openalex.org/W2891575196","https://openalex.org/W2937423263","https://openalex.org/W2963341956","https://openalex.org/W2963748441","https://openalex.org/W2965373594","https://openalex.org/W2970200208","https://openalex.org/W2970476646","https://openalex.org/W3034999214","https://openalex.org/W3098267758","https://openalex.org/W3105625590","https://openalex.org/W3106109117","https://openalex.org/W3153427360","https://openalex.org/W3166913490","https://openalex.org/W3173777717","https://openalex.org/W3174784402","https://openalex.org/W3188542058","https://openalex.org/W3210129272","https://openalex.org/W4237040408","https://openalex.org/W4288089799","https://openalex.org/W4288351520","https://openalex.org/W4292779060","https://openalex.org/W4309811444","https://openalex.org/W4385571571","https://openalex.org/W4385572905","https://openalex.org/W4385573679","https://openalex.org/W4385574162","https://openalex.org/W6676984168","https://openalex.org/W6685053522","https://openalex.org/W6691459498","https://openalex.org/W6729938257","https://openalex.org/W6757635932","https://openalex.org/W6766673545","https://openalex.org/W6769627184","https://openalex.org/W6778883912","https://openalex.org/W6801016683","https://openalex.org/W6846979011"],"related_works":["https://openalex.org/W2074502265","https://openalex.org/W4214877189","https://openalex.org/W2773965352","https://openalex.org/W2381179799","https://openalex.org/W2980279061","https://openalex.org/W2334685461","https://openalex.org/W2366718574","https://openalex.org/W2359774528","https://openalex.org/W4298312966","https://openalex.org/W3204019825"],"abstract_inverted_index":{"Prompt-based":[0],"methods":[1,195],"with":[2,120,206,219],"Pre-trained":[3],"Language":[4],"Models":[5],"(PLMs)":[6],"have":[7],"demonstrated":[8],"remarkable":[9],"zero-shot":[10,33,72,222],"performance":[11],"in":[12,52,63],"text":[13],"classification":[14,186],"tasks.":[15],"Among":[16],"these":[17],"methods,":[18],"verbalizers":[19],"are":[20],"employed":[21],"to":[22,141,155,167],"convert":[23],"model-predicted":[24],"vocabulary":[25],"logits":[26],"into":[27],"task-specific":[28],"labels.":[29],"However,":[30],"most":[31],"existing":[32,220],"approaches":[34],"face":[35],"several":[36],"challenges:":[37],"(1)":[38,81],"a":[39,57,69,84,105,118,128,151,164],"reliance":[40],"on":[41,133,181,204],"unlabeled":[42],"data":[43,54,111],"or":[44,112],"additional":[45],"knowledge":[46],"bases,":[47],"which":[48],"limits":[49],"their":[50],"effectiveness":[51],"varied":[53],"scenarios;":[55],"(2)":[56,125],"disregard":[58],"for":[59],"semantic":[60,134,144],"ambiguity":[61,145],"issues":[62],"verbalizer":[64,119,161],"construction.":[65],"This":[66],"paper":[67],"presents":[68],"novel":[70],"fully":[71,221],"approach":[73],"named":[74],"Hierarchical":[75,87,152],"Generative":[76,78],"Semantic-Aware":[77,129],"Verbalizer":[79,89],"(HGSVerb).":[80],"We":[82,126,178,199],"propose":[83,127],"prompt-based":[85],"module,":[86],"Semantic":[88],"Generation,":[90],"that":[91],"explores":[92],"the":[93,99,143,157,169,215],"full":[94],"utilization":[95,158],"of":[96,101,159,171,209],"PLMs":[97],"and":[98,123,139,184,188,211],"semantics":[100,122],"label":[102,137,172],"names.":[103],"As":[104],"result,":[106],"without":[107],"requiring":[108],"any":[109],"extra":[110,197],"knowledge,":[113],"our":[114,160,189],"model":[115],"iteratively":[116],"generates":[117],"hierarchical":[121],"structure.":[124],"Refinement":[130],"method":[131],"based":[132],"distance":[135],"between":[136],"words":[138,173],"categories":[140],"reduce":[142],"issue.":[146],"(3)":[147],"Additionally,":[148],"HGSVerb":[149,180,213],"introduces":[150],"Weight":[153],"Aggregation":[154],"optimize":[156],"by":[162,175],"using":[163],"decay":[165],"coefficient":[166],"distinguish":[168],"importance":[170],"generated":[174],"different":[176],"iterations.":[177],"evaluate":[179],"four":[182],"topic":[183],"sentiment":[185],"datasets,":[187],"average":[190],"accuracy":[191],"even":[192],"outperforms":[193],"those":[194],"utilizing":[196],"resources.":[198],"also":[200],"examine":[201],"its":[202],"transferability":[203],"datasets":[205],"diverse":[207],"numbers":[208],"classes":[210],"topics.":[212],"achieves":[214],"best":[216],"results":[217],"compared":[218],"methods.":[223]},"counts_by_year":[],"updated_date":"2025-12-27T23:08:20.325037","created_date":"2025-10-10T00:00:00"}
