{"id":"https://openalex.org/W7118246252","doi":"https://doi.org/10.48550/arxiv.2601.00543","title":"ECR: Manifold-Guided Semantic Cues for Compact Language Models","display_name":"ECR: Manifold-Guided Semantic Cues for Compact Language Models","publication_year":2026,"publication_date":"2026-01-02","ids":{"openalex":"https://openalex.org/W7118246252","doi":"https://doi.org/10.48550/arxiv.2601.00543"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2601.00543","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.00543","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2601.00543","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5122219737","display_name":"Chung-Wei Victor Yuan","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Yuan, Chung-Wei Victor","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5122219737"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.43799999356269836,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.43799999356269836,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.06639999896287918,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.05820000171661377,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.6944000124931335},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.510200023651123},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4984000027179718},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.4754999876022339},{"id":"https://openalex.org/keywords/projection","display_name":"Projection (relational algebra)","score":0.43459999561309814},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.41499999165534973},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.3837999999523163},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.36309999227523804},{"id":"https://openalex.org/keywords/compact-space","display_name":"Compact space","score":0.35850000381469727},{"id":"https://openalex.org/keywords/semantic-matching","display_name":"Semantic matching","score":0.35030001401901245}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7562999725341797},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.6944000124931335},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.510200023651123},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4984000027179718},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.4754999876022339},{"id":"https://openalex.org/C57493831","wikidata":"https://www.wikidata.org/wiki/Q3134666","display_name":"Projection (relational algebra)","level":2,"score":0.43459999561309814},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.41499999165534973},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4016000032424927},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.38989999890327454},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.3837999999523163},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.36309999227523804},{"id":"https://openalex.org/C18648836","wikidata":"https://www.wikidata.org/wiki/Q381892","display_name":"Compact space","level":2,"score":0.35850000381469727},{"id":"https://openalex.org/C2778493491","wikidata":"https://www.wikidata.org/wiki/Q7449072","display_name":"Semantic matching","level":3,"score":0.35030001401901245},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.3407000005245209},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.33570000529289246},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.3321000039577484},{"id":"https://openalex.org/C174348530","wikidata":"https://www.wikidata.org/wiki/Q188635","display_name":"Bridging (networking)","level":2,"score":0.3303000032901764},{"id":"https://openalex.org/C90312973","wikidata":"https://www.wikidata.org/wiki/Q7449052","display_name":"Semantic data model","level":2,"score":0.32179999351501465},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3192000091075897},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.3181000053882599},{"id":"https://openalex.org/C529865628","wikidata":"https://www.wikidata.org/wiki/Q1790740","display_name":"Manifold (fluid mechanics)","level":2,"score":0.29989999532699585},{"id":"https://openalex.org/C157486923","wikidata":"https://www.wikidata.org/wiki/Q1376436","display_name":"String (physics)","level":2,"score":0.2957000136375427},{"id":"https://openalex.org/C2779439875","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Natural language understanding","level":3,"score":0.2948000133037567},{"id":"https://openalex.org/C198942812","wikidata":"https://www.wikidata.org/wiki/Q496618","display_name":"Semantic property","level":2,"score":0.29280000925064087},{"id":"https://openalex.org/C108882727","wikidata":"https://www.wikidata.org/wiki/Q2991685","display_name":"Solid modeling","level":2,"score":0.28610000014305115},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.2833000123500824},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.27469998598098755},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.27390000224113464},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.26669999957084656},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.26179999113082886},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.25780001282691956},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.2572999894618988},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.25220000743865967},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.2506999969482422}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2601.00543","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.00543","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2601.00543","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.00543","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.7947937846183777,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Compact":[0],"models":[1,181,211],"often":[2,61],"lose":[3],"the":[4,15,20,36,55,67,80,113,143],"structure":[5,164],"of":[6,103],"their":[7],"embedding":[8],"space.":[9],"The":[10],"issue":[11],"shows":[12],"up":[13],"when":[14],"capacity":[16],"is":[17,195],"tight":[18],"or":[19,129,146,225],"data":[21],"spans":[22],"several":[23],"languages.":[24,168],"Such":[25],"collapse":[26],"makes":[27,217],"it":[28],"difficult":[29],"for":[30],"downstream":[31],"tasks":[32,166],"to":[33,53,63,77,117,182,220],"build":[34],"on":[35,43,126,152],"resulting":[37],"representation.":[38],"Existing":[39],"compression":[40],"methods":[41],"focus":[42],"aligning":[44],"model":[45,115],"outputs":[46,193],"at":[47,139],"a":[48,89,101,135,153,172],"superficial":[49],"level":[50],"but":[51,198],"fail":[52],"preserve":[54],"underlying":[56],"manifold":[57],"structure.":[58],"This":[59,97],"mismatch":[60],"leads":[62],"semantic":[64,104,163],"drift":[65],"in":[66],"compact":[68,114,174,210],"model,":[69],"causing":[70],"both":[71],"task":[72,214],"behavior":[73],"and":[74,161,167,175,194,216],"linguistic":[75],"properties":[76],"deviate":[78],"from":[79,106],"reference":[81],"model.":[82],"To":[83],"address":[84],"those":[85],"issues,":[86],"we":[87],"provide":[88],"new":[90],"framework":[91,98],"called":[92],"Embedding":[93],"Consistency":[94],"Regulation":[95],"(ECR).":[96],"first":[99],"derives":[100],"set":[102],"anchors":[105],"teacher":[107,192],"embeddings":[108],"(computed":[109],"once":[110],"offline).":[111],"Then,":[112],"learns":[116],"maintain":[118],"consistent":[119],"geometry":[120],"around":[121],"these":[122],"anchors,":[123],"without":[124,141,191],"relying":[125],"matching":[127],"logits":[128],"internal":[130],"features.":[131],"ECR":[132,157,189,208],"adds":[133],"only":[134],"small":[136],"projection":[137],"step":[138],"inference,":[140],"altering":[142],"decoding":[144],"architecture":[145],"its":[147],"runtime":[148],"behavior.":[149],"In":[150],"experiments":[151],"100K":[154],"multilingual":[155],"corpus,":[156],"consistently":[158],"stabilizes":[159],"training":[160],"preserves":[162],"across":[165],"It":[169],"also":[170],"produces":[171],"more":[173],"task-aligned":[176],"representation":[177],"space,":[178],"enabling":[179],"low-capacity":[180],"learn":[183],"cleaner":[184],"manifolds":[185],"than":[186],"conventional":[187],"baselines.":[188],"works":[190],"compatible":[196],"with,":[197],"independent":[199],"of,":[200],"distillation.":[201],"Taken":[202],"together,":[203],"our":[204],"results":[205],"show":[206],"that":[207],"helps":[209],"better":[212],"follow":[213],"requirements":[215],"them":[218],"easier":[219],"deploy":[221],"under":[222],"strict":[223],"efficiency":[224],"privacy":[226],"limits.":[227]},"counts_by_year":[],"updated_date":"2026-01-08T20:10:11.968330","created_date":"2026-01-08T00:00:00"}
