{"id":"https://openalex.org/W4396757493","doi":"https://doi.org/10.1145/3589334.3645711","title":"Understanding Human Preferences: Towards More Personalized Video to Text Generation","display_name":"Understanding Human Preferences: Towards More Personalized Video to Text Generation","publication_year":2024,"publication_date":"2024-05-08","ids":{"openalex":"https://openalex.org/W4396757493","doi":"https://doi.org/10.1145/3589334.3645711"},"language":"en","primary_location":{"id":"doi:10.1145/3589334.3645711","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3589334.3645711","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM Web Conference 2024","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5010596810","display_name":"Yihan Wu","orcid":"https://orcid.org/0009-0001-0312-782X"},"institutions":[{"id":"https://openalex.org/I78988378","display_name":"Renmin University of China","ror":"https://ror.org/041pakw92","country_code":"CN","type":"education","lineage":["https://openalex.org/I78988378"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yihan Wu","raw_affiliation_strings":["Gaoling School of Artificial Intelligence, Renmin University of China, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0001-0312-782X","affiliations":[{"raw_affiliation_string":"Gaoling School of Artificial Intelligence, Renmin University of China, Beijing, China","institution_ids":["https://openalex.org/I78988378"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101505571","display_name":"Ruihua Song","orcid":"https://orcid.org/0000-0002-2163-7401"},"institutions":[{"id":"https://openalex.org/I78988378","display_name":"Renmin University of China","ror":"https://ror.org/041pakw92","country_code":"CN","type":"education","lineage":["https://openalex.org/I78988378"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ruihua Song","raw_affiliation_strings":["Gaoling School of Artificial Intelligence, Renmin University of China, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-2163-7401","affiliations":[{"raw_affiliation_string":"Gaoling School of Artificial Intelligence, Renmin University of China, Beijing, China","institution_ids":["https://openalex.org/I78988378"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101755392","display_name":"Xu Chen","orcid":"https://orcid.org/0000-0003-0144-1775"},"institutions":[{"id":"https://openalex.org/I78988378","display_name":"Renmin University of China","ror":"https://ror.org/041pakw92","country_code":"CN","type":"education","lineage":["https://openalex.org/I78988378"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xu Chen","raw_affiliation_strings":["Gaoling School of Artificial Intelligence, Renmin University of China, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-0144-1775","affiliations":[{"raw_affiliation_string":"Gaoling School of Artificial Intelligence, Renmin University of China, Beijing, China","institution_ids":["https://openalex.org/I78988378"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002846606","display_name":"Hao Jiang","orcid":"https://orcid.org/0000-0002-2306-7596"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hao Jiang","raw_affiliation_strings":["Poisson Lab, Huawei, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-2306-7596","affiliations":[{"raw_affiliation_string":"Poisson Lab, Huawei, Beijing, China","institution_ids":["https://openalex.org/I2250955327"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000839824","display_name":"Zhao Cao","orcid":"https://orcid.org/0000-0002-4214-7858"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhao Cao","raw_affiliation_strings":["Poisson Lab, Huawei, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-4214-7858","affiliations":[{"raw_affiliation_string":"Poisson Lab, Huawei, Beijing, China","institution_ids":["https://openalex.org/I2250955327"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101403770","display_name":"Jin Yu","orcid":"https://orcid.org/0000-0002-3371-6609"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jin Yu","raw_affiliation_strings":["Poisson Lab, Huawei, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-3371-6609","affiliations":[{"raw_affiliation_string":"Poisson Lab, Huawei, Beijing, China","institution_ids":["https://openalex.org/I2250955327"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5010596810"],"corresponding_institution_ids":["https://openalex.org/I78988378"],"apc_list":null,"apc_paid":null,"fwci":0.4762,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.60733643,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"3952","last_page":"3963"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.995199978351593,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.683940052986145},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.40508487820625305},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.3642926514148712},{"id":"https://openalex.org/keywords/internet-privacy","display_name":"Internet privacy","score":0.3406113386154175}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.683940052986145},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.40508487820625305},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.3642926514148712},{"id":"https://openalex.org/C108827166","wikidata":"https://www.wikidata.org/wiki/Q175975","display_name":"Internet privacy","level":1,"score":0.3406113386154175}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3589334.3645711","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3589334.3645711","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM Web Conference 2024","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G7883544670","display_name":null,"funder_award_id":"62276268","funder_id":"https://openalex.org/F4320323817","funder_display_name":"Universitas Brawijaya"}],"funders":[{"id":"https://openalex.org/F4320323817","display_name":"Universitas Brawijaya","ror":"https://ror.org/01wk3d929"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":34,"referenced_works":["https://openalex.org/W1956340063","https://openalex.org/W1981780064","https://openalex.org/W2028485238","https://openalex.org/W2046281687","https://openalex.org/W2101105183","https://openalex.org/W2108598243","https://openalex.org/W2133459682","https://openalex.org/W2560674852","https://openalex.org/W2583875861","https://openalex.org/W2607579284","https://openalex.org/W2740409734","https://openalex.org/W2747329762","https://openalex.org/W2765716052","https://openalex.org/W2798331900","https://openalex.org/W2893085659","https://openalex.org/W2954199749","https://openalex.org/W2962944176","https://openalex.org/W2964258748","https://openalex.org/W2964512901","https://openalex.org/W2982260276","https://openalex.org/W2998409107","https://openalex.org/W3005527857","https://openalex.org/W3034815696","https://openalex.org/W3035365026","https://openalex.org/W3093187109","https://openalex.org/W3101422495","https://openalex.org/W3161135883","https://openalex.org/W3167057046","https://openalex.org/W3208227120","https://openalex.org/W3217340782","https://openalex.org/W4200476698","https://openalex.org/W4211186029","https://openalex.org/W4318620058","https://openalex.org/W4318718936"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"While":[0],"previous":[1],"video":[2,18,59,73,94,238],"to":[3,15,26,177,203,218,239,257],"text":[4,173,240],"models":[5],"have":[6],"achieved":[7],"remarkable":[8],"successes,":[9],"they":[10],"mostly":[11],"focus":[12],"on":[13,114,143,182],"how":[14],"understand":[16],"the":[17,28,69,91,107,120,158,161,166,179,183,188,220,223,230,234,259],"contents":[19],"in":[20,45,54,100,165,199,229],"a":[21,57,150,172,246],"general":[22],"sense,":[23],"but":[24],"fail":[25],"capture":[27],"human":[29],"personalized":[30,72,80,237],"preferences,":[31],"which":[32,153,175],"is":[33,49,61,149,154,171],"highly":[34],"demanded":[35],"for":[36,82,93,106,119,156,249],"an":[37,78,200],"engaging":[38],"multimodal":[39],"chatbots.":[40],"Different":[41],"from":[42],"user":[43,52,162],"modeling":[44],"collaborative":[46],"filtering,":[47],"there":[48],"no":[50],"other":[51],"behaviors":[53],"inference":[55,216,231],"as":[56],"real-time":[58],"stream":[60],"coming.":[62],"In":[63,86,191],"this":[64,84,251],"paper,":[65],"we":[66,88,138,209,242],"formally":[67],"define":[68],"task":[70,75],"of":[71,236,261],"commenting":[74],"and":[76,117,187,214,244],"design":[77,139,210],"end-to-end":[79,201],"framework":[81,141],"solving":[83],"task.":[85],"specific,":[87],"argue":[89],"that":[90,103,160,222],"personalization":[92],"comment":[95,113,164,180],"generation":[96],"can":[97],"be":[98],"reflected":[99],"two":[101,144,195],"aspects,":[102],"is,":[104],"(1)":[105],"same":[108,121],"video,":[109],"different":[110,115,123],"users":[111],"may":[112,125,163],"clips,":[116],"(2)":[118],"clip,":[122],"people":[124],"also":[126],"express":[127],"various":[128],"opinions":[129],"with":[130],"diverse":[131],"commentary":[132],"styles.":[133],"Motivated":[134],"by":[135],"these":[136,194],"considerations,":[137],"our":[140,192,262],"based":[142,181],"components.":[145],"The":[146,168],"first":[147],"one":[148,170],"clip":[151],"selector,":[152],"responsible":[155],"predicting":[157],"clips":[159,186,226],"video.":[167],"second":[169],"generator,":[174],"aims":[176],"produce":[178],"above":[184],"predicted":[185],"user's":[189],"preference.":[190],"framework,":[193],"components":[196],"are":[197,227],"optimized":[198],"manner":[202],"mutually":[204],"enhance":[205],"each":[206],"other,":[207],"where":[208],"confidence-aware":[211],"scheduled":[212],"sampling":[213],"iterative":[215],"strategies":[217],"solve":[219],"problem":[221],"ground":[224],"truth":[225],"absent":[228],"phase.":[232],"As":[233],"absence":[235],"dataset,":[241],"collect":[243],"release":[245],"new":[247],"dataset":[248],"studying":[250],"problem.":[252],"We":[253],"conduct":[254],"extensive":[255],"experiments":[256],"demonstrate":[258],"effectiveness":[260],"model.":[263]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
