{"id":"https://openalex.org/W7158250005","doi":"https://doi.org/10.48550/arxiv.2604.25839","title":"Break the Inaccessible Boundary: Distilling Post-Conversion Content for User Retention Modeling","display_name":"Break the Inaccessible Boundary: Distilling Post-Conversion Content for User Retention Modeling","publication_year":2026,"publication_date":"2026-04-28","ids":{"openalex":"https://openalex.org/W7158250005","doi":"https://doi.org/10.48550/arxiv.2604.25839"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.25839","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.25839","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.25839","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100822935","display_name":"Tianbao Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Ma, Tianbao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041679814","display_name":"Ruochen Yang","orcid":"https://orcid.org/0000-0002-5468-9638"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Ruochen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134832669","display_name":"Chengen Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Chengen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132735308","display_name":"Yuexin Shi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shi, Yuexin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134838286","display_name":"Jiangxia Cao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cao, Jiangxia","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035034659","display_name":"Linxun Chen","orcid":"https://orcid.org/0000-0003-3764-737X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Linxun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134840307","display_name":"Zhaojie Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Zhaojie","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134824125","display_name":"Yanan Niu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Niu, Yanan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134854992","display_name":"Han Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Han","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5134854358","display_name":"Kun Gai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gai, Kun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":10,"corresponding_author_ids":["https://openalex.org/A5100822935"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.4230000078678131,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.4230000078678131,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11704","display_name":"Mobile Crowdsensing and Crowdsourcing","score":0.12530000507831573,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11161","display_name":"Consumer Market Behavior and Pricing","score":0.06669999659061432,"subfield":{"id":"https://openalex.org/subfields/1406","display_name":"Marketing"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/onboarding","display_name":"Onboarding","score":0.9369000196456909},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.7465000152587891},{"id":"https://openalex.org/keywords/bidding","display_name":"Bidding","score":0.7402999997138977},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.4713999927043915},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.4309999942779541},{"id":"https://openalex.org/keywords/content","display_name":"Content (measure theory)","score":0.4059000015258789},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.40400001406669617},{"id":"https://openalex.org/keywords/user-engagement","display_name":"User engagement","score":0.359499990940094}],"concepts":[{"id":"https://openalex.org/C2779185108","wikidata":"https://www.wikidata.org/wiki/Q7091744","display_name":"Onboarding","level":2,"score":0.9369000196456909},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.7465000152587891},{"id":"https://openalex.org/C9233905","wikidata":"https://www.wikidata.org/wiki/Q3276328","display_name":"Bidding","level":2,"score":0.7402999997138977},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7026000022888184},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4713999927043915},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.4309999942779541},{"id":"https://openalex.org/C2778152352","wikidata":"https://www.wikidata.org/wiki/Q5165061","display_name":"Content (measure theory)","level":2,"score":0.4059000015258789},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.40400001406669617},{"id":"https://openalex.org/C2984870255","wikidata":"https://www.wikidata.org/wiki/Q5196451","display_name":"User engagement","level":2,"score":0.359499990940094},{"id":"https://openalex.org/C154504017","wikidata":"https://www.wikidata.org/wiki/Q853614","display_name":"Identifier","level":2,"score":0.3587000072002411},{"id":"https://openalex.org/C159023312","wikidata":"https://www.wikidata.org/wiki/Q409513","display_name":"NOP","level":3,"score":0.34950000047683716},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.30329999327659607},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.29499998688697815},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.2896000146865845},{"id":"https://openalex.org/C101293273","wikidata":"https://www.wikidata.org/wiki/Q579716","display_name":"User-generated content","level":3,"score":0.2888999879360199},{"id":"https://openalex.org/C91262260","wikidata":"https://www.wikidata.org/wiki/Q528074","display_name":"End user","level":2,"score":0.27869999408721924},{"id":"https://openalex.org/C187191949","wikidata":"https://www.wikidata.org/wiki/Q1138496","display_name":"Profiling (computer programming)","level":2,"score":0.2727000117301941},{"id":"https://openalex.org/C3020234875","wikidata":"https://www.wikidata.org/wiki/Q1260632","display_name":"Media content","level":2,"score":0.27230000495910645},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.2556999921798706}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.25839","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.25839","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.25839","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.25839","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"User":[0],"retention":[1,23,54],"is":[2,25,129],"a":[3,67,80,115,126,163],"key":[4],"metric":[5],"to":[6,27,93,113,140],"measure":[7],"long-term":[8],"engagement":[9],"in":[10,59,162],"modern":[11],"platforms.":[12],"In":[13,104,122],"real-time":[14],"bidding":[15,33],"(RTB)":[16],"advertising":[17],"system":[18],"for":[19,53,84],"user":[20,37,127],"re-engagement,":[21],"the":[22,36,91,105,123,132,138,142],"model":[24,92,139],"required":[26],"predict":[28],"future":[29,96],"revisit":[30],"probability":[31],"at":[32],"time,":[34],"before":[35],"converts":[38],"and":[39,65,71,151],"consumes":[40],"any":[41],"content.":[42],"Although":[43],"post-conversion":[44],"content,":[45],"termed":[46],"Onboarding":[47,85],"Content,":[48],"provides":[49],"highly":[50],"informative":[51],"signals":[52,145],"prediction,":[55],"directly":[56],"using":[57,98],"it":[58],"training":[60,70],"causes":[61],"severe":[62],"feature":[63],"leakage":[64],"creates":[66],"gap":[68],"between":[69],"serving.":[72],"To":[73],"address":[74],"this":[75],"issue,":[76],"we":[77,108],"propose":[78],"OCARM,":[79],"two-stage":[81],"distillation-aligned":[82],"framework":[83,158],"Content":[86],"Augmented":[87],"Retention":[88],"Modeling,":[89],"enabling":[90],"implicitly":[94],"capture":[95],"content":[97,112],"only":[99],"observable":[100],"features":[101],"during":[102],"inference.":[103],"first":[106],"stage,":[107,125],"deliberately":[109],"expose":[110],"onboarding":[111,144],"train":[114],"hierarchical":[116],"encoder":[117,128],"that":[118,156],"produces":[119],"teacher":[120,134],"representations.":[121],"second":[124],"aligned":[130],"with":[131],"frozen":[133],"through":[135],"distillation,":[136],"allowing":[137],"approximate":[141],"inaccessible":[143],"without":[146],"leakage.":[147],"Extensive":[148],"offline":[149],"experiments":[150],"online":[152],"A/B":[153],"tests":[154],"demonstrate":[155],"our":[157],"achieves":[159],"consistent":[160],"improvements":[161],"real-world":[164],"growth":[165],"scenario.":[166]},"counts_by_year":[],"updated_date":"2026-04-30T06:11:10.768123","created_date":"2026-04-30T00:00:00"}
