{"id":"https://openalex.org/W7164827911","doi":"https://doi.org/10.1145/3805622.3810576","title":"PSRNet: Progressive Semantic Refinement for Human Parsing via Text Conditioning and Embedding-Based Calibration","display_name":"PSRNet: Progressive Semantic Refinement for Human Parsing via Text Conditioning and Embedding-Based Calibration","publication_year":2026,"publication_date":"2026-06-15","ids":{"openalex":"https://openalex.org/W7164827911","doi":"https://doi.org/10.1145/3805622.3810576"},"language":null,"primary_location":{"id":"doi:10.1145/3805622.3810576","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3805622.3810576","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2026 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3805622.3810576","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053668695","display_name":"Ming Meng","orcid":"https://orcid.org/0000-0002-3711-3821"},"institutions":[{"id":"https://openalex.org/I75689368","display_name":"Communication University of China","ror":"https://ror.org/04facbs33","country_code":"CN","type":"education","lineage":["https://openalex.org/I75689368"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ming Meng","raw_affiliation_strings":["School of Data Science and Intelligent Media, Communication University of China, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-3711-3821","affiliations":[{"raw_affiliation_string":"School of Data Science and Intelligent Media, Communication University of China, Beijing, China","institution_ids":["https://openalex.org/I75689368"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130919553","display_name":"Hanwen Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I20942203","display_name":"Hainan University","ror":"https://ror.org/03q648j11","country_code":"CN","type":"education","lineage":["https://openalex.org/I20942203"]},{"id":"https://openalex.org/I75689368","display_name":"Communication University of China","ror":"https://ror.org/04facbs33","country_code":"CN","type":"education","lineage":["https://openalex.org/I75689368"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hanwen Liu","raw_affiliation_strings":["Hainan International College, Communication University of China, Hainan, China"],"raw_orcid":"https://orcid.org/0009-0003-6271-5239","affiliations":[{"raw_affiliation_string":"Hainan International College, Communication University of China, Hainan, China","institution_ids":["https://openalex.org/I20942203","https://openalex.org/I75689368"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5138664493","display_name":"Xingxing Xiang","orcid":"https://orcid.org/0009-0001-7181-7574"},"institutions":[{"id":"https://openalex.org/I146563203","display_name":"University of International Business and Economics","ror":"https://ror.org/05khqpb71","country_code":"CN","type":"education","lineage":["https://openalex.org/I146563203"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xingxing Xiang","raw_affiliation_strings":["School of International Business, University of International Business and Economics, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0001-7181-7574","affiliations":[{"raw_affiliation_string":"School of International Business, University of International Business and Economics, Beijing, China","institution_ids":["https://openalex.org/I146563203"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100600271","display_name":"Long Ye","orcid":"https://orcid.org/0000-0002-3562-5612"},"institutions":[{"id":"https://openalex.org/I75689368","display_name":"Communication University of China","ror":"https://ror.org/04facbs33","country_code":"CN","type":"education","lineage":["https://openalex.org/I75689368"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Long Ye","raw_affiliation_strings":["School of Data Science and Intelligent Media, Communication University of China, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-3562-5612","affiliations":[{"raw_affiliation_string":"School of Data Science and Intelligent Media, Communication University of China, Beijing, China","institution_ids":["https://openalex.org/I75689368"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060498902","display_name":"Lei Zhang","orcid":"https://orcid.org/0000-0003-3689-6868"},"institutions":[{"id":"https://openalex.org/I179026463","display_name":"Beijing Technology and Business University","ror":"https://ror.org/013e0zm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I179026463"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lei Zhang","raw_affiliation_strings":["School of Computer and Artificial Intelligence, Beijing Technology and Business University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-3689-6868","affiliations":[{"raw_affiliation_string":"School of Computer and Artificial Intelligence, Beijing Technology and Business University, Beijing, China","institution_ids":["https://openalex.org/I179026463"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5021141988","display_name":"Zhaoxin Fan","orcid":"https://orcid.org/0000-0002-6324-1712"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhaoxin Fan","raw_affiliation_strings":["Beijing Advanced Innovation Center for Future Blockchain and Privacy Computing, Beihang University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-6324-1712","affiliations":[{"raw_affiliation_string":"Beijing Advanced Innovation Center for Future Blockchain and Privacy Computing, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.94803946,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1222","last_page":"1230"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.46209999918937683,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.46209999918937683,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.0869000032544136,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.05460000038146973,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.7685999870300293},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.6284000277519226},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.5498999953269958},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.4832000136375427},{"id":"https://openalex.org/keywords/boundary","display_name":"Boundary (topology)","score":0.4523000121116638},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.4325999915599823},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.40139999985694885},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.3644999861717224}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7950999736785889},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.7685999870300293},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6575999855995178},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.6284000277519226},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5989000201225281},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.5498999953269958},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.4832000136375427},{"id":"https://openalex.org/C62354387","wikidata":"https://www.wikidata.org/wiki/Q875399","display_name":"Boundary (topology)","level":2,"score":0.4523000121116638},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.4325999915599823},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.40139999985694885},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.3644999861717224},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3617999851703644},{"id":"https://openalex.org/C165838908","wikidata":"https://www.wikidata.org/wiki/Q736777","display_name":"Calibration","level":2,"score":0.3589000105857849},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.34450000524520874},{"id":"https://openalex.org/C17231256","wikidata":"https://www.wikidata.org/wiki/Q5156540","display_name":"Completeness (order theory)","level":2,"score":0.3434000015258789},{"id":"https://openalex.org/C146849305","wikidata":"https://www.wikidata.org/wiki/Q370766","display_name":"Ground truth","level":2,"score":0.3287999927997589},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.31029999256134033},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.296999990940094},{"id":"https://openalex.org/C138268822","wikidata":"https://www.wikidata.org/wiki/Q1051925","display_name":"Resolution (logic)","level":2,"score":0.2969000041484833},{"id":"https://openalex.org/C2781140086","wikidata":"https://www.wikidata.org/wiki/Q557945","display_name":"Confusion","level":2,"score":0.2874000072479248},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.2833000123500824},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.28049999475479126},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.2800000011920929},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.26409998536109924}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3805622.3810576","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3805622.3810576","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2026 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3805622.3810576","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3805622.3810576","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2026 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.7580681443214417,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W1903029394","https://openalex.org/W2194775991","https://openalex.org/W2412782625","https://openalex.org/W2560023338","https://openalex.org/W2598915960","https://openalex.org/W2737682710","https://openalex.org/W2883779225","https://openalex.org/W2886799640","https://openalex.org/W2924485953","https://openalex.org/W2962891704","https://openalex.org/W2963578952","https://openalex.org/W2964072977","https://openalex.org/W2964252655","https://openalex.org/W2964309882","https://openalex.org/W2981959899","https://openalex.org/W3009224666","https://openalex.org/W3034230284","https://openalex.org/W3034509543","https://openalex.org/W3034760601","https://openalex.org/W3108326630","https://openalex.org/W3108657013","https://openalex.org/W3195135988","https://openalex.org/W3198020043","https://openalex.org/W4226030517","https://openalex.org/W4226058394","https://openalex.org/W4289745225","https://openalex.org/W4292964465","https://openalex.org/W4312420092","https://openalex.org/W4312815172","https://openalex.org/W4312980231","https://openalex.org/W4386076305","https://openalex.org/W4386076618","https://openalex.org/W4391878209","https://openalex.org/W4392615480","https://openalex.org/W4404172003","https://openalex.org/W4409262755","https://openalex.org/W4413079717","https://openalex.org/W4413145645"],"related_works":[],"abstract_inverted_index":{"Human":[0],"parsing":[1,45,142],"requires":[2],"fine-grained,":[3],"pixel-level":[4],"delineation":[5],"of":[6],"human":[7],"parts":[8,17],"and":[9,15,22,74,116,121,134,144],"accessories,":[10],"yet":[11],"visually":[12],"correlated":[13],"categories":[14],"long-tailed":[16],"often":[18],"cause":[19],"semantic":[20,37],"confusion":[21],"boundary":[23,109,145],"ambiguity.":[24],"We":[25],"propose":[26],"PSRNet,":[27],"a":[28,47,51,71,79,101],"Progressive":[29],"Semantic":[30],"Refinement":[31,104],"Network":[32],"that":[33,107,137],"exploits":[34],"fixed":[35],"class":[36,58],"embeddings":[38],"derived":[39],"from":[40],"category":[41,89],"text":[42],"to":[43,60,87],"refine":[44],"in":[46],"coarse-to-fine":[48],"manner.":[49],"First,":[50],"Text-Conditioned":[52],"Feature":[53],"Modulation":[54],"(TCFM)":[55],"module":[56,77],"injects":[57],"semantics":[59],"modulate":[61],"encoder":[62],"features,":[63],"enhancing":[64],"low-level":[65],"discriminability":[66],"for":[67],"confusing":[68,155],"parts.":[69],"Second,":[70],"Semantic-Embedding":[72],"Calibration":[73],"Fusion":[75],"(SECF)":[76],"combines":[78],"conventional":[80],"linear":[81],"classifier":[82],"with":[83,150],"an":[84],"embedding-similarity":[85],"head":[86],"calibrate":[88],"logits,":[90],"effectively":[91],"reducing":[92],"misclassification":[93],"among":[94],"semantically":[95],"close":[96],"classes.":[97],"Third,":[98],"we":[99],"introduce":[100],"Morphology-Guided":[102],"Boundary":[103],"loss":[105],"(MGBR)":[106],"constructs":[108],"supervision":[110],"via":[111],"dilation\u2013erosion":[112],"operations":[113],"on":[114,128,154],"predictions":[115],"ground":[117],"truth,":[118],"encouraging":[119],"sharper":[120],"more":[122],"consistent":[123],"part":[124,156],"boundaries.":[125],"Extensive":[126],"experiments":[127],"two":[129],"widely":[130],"used":[131],"benchmarks,":[132],"LIP":[133],"CIHP,":[135],"demonstrate":[136],"PSRNet":[138],"consistently":[139],"improves":[140],"both":[141],"accuracy":[143],"quality":[146],"over":[147],"strong":[148],"baselines,":[149],"particularly":[151],"notable":[152],"gains":[153],"pairs.":[157]},"counts_by_year":[],"updated_date":"2026-06-16T07:37:23.134862","created_date":"2026-06-16T00:00:00"}
