{"id":"https://openalex.org/W3112256745","doi":"https://doi.org/10.1109/access.2020.3042778","title":"Short Text Embedding Autoencoders With Attention-Based Neighborhood Preservation","display_name":"Short Text Embedding Autoencoders With Attention-Based Neighborhood Preservation","publication_year":2020,"publication_date":"2020-01-01","ids":{"openalex":"https://openalex.org/W3112256745","doi":"https://doi.org/10.1109/access.2020.3042778","mag":"3112256745"},"language":"en","primary_location":{"id":"doi:10.1109/access.2020.3042778","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.3042778","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/09284562.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/09284562.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101419444","display_name":"Chao Wei","orcid":"https://orcid.org/0000-0002-3502-6951"},"institutions":[{"id":"https://openalex.org/I4210104311","display_name":"Institute of Scientific and Technical Information of China","ror":"https://ror.org/01b2av652","country_code":"CN","type":"government","lineage":["https://openalex.org/I4210104311","https://openalex.org/I4210120069","https://openalex.org/I4210127390"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chao Wei","raw_affiliation_strings":["National Engineering Research Center of Science and Technology Information, Institute of Scientific and Technical Information of China, Beijing, China"],"affiliations":[{"raw_affiliation_string":"National Engineering Research Center of Science and Technology Information, Institute of Scientific and Technical Information of China, Beijing, China","institution_ids":["https://openalex.org/I4210104311"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101410569","display_name":"Lijun Zhu","orcid":"https://orcid.org/0000-0002-7854-0424"},"institutions":[{"id":"https://openalex.org/I4210104311","display_name":"Institute of Scientific and Technical Information of China","ror":"https://ror.org/01b2av652","country_code":"CN","type":"government","lineage":["https://openalex.org/I4210104311","https://openalex.org/I4210120069","https://openalex.org/I4210127390"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lijun Zhu","raw_affiliation_strings":["National Engineering Research Center of Science and Technology Information, Institute of Scientific and Technical Information of China, Beijing, China"],"affiliations":[{"raw_affiliation_string":"National Engineering Research Center of Science and Technology Information, Institute of Scientific and Technical Information of China, Beijing, China","institution_ids":["https://openalex.org/I4210104311"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5055427915","display_name":"Jiaoxiang Shi","orcid":null},"institutions":[{"id":"https://openalex.org/I4210104311","display_name":"Institute of Scientific and Technical Information of China","ror":"https://ror.org/01b2av652","country_code":"CN","type":"government","lineage":["https://openalex.org/I4210104311","https://openalex.org/I4210120069","https://openalex.org/I4210127390"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiaoxiang Shi","raw_affiliation_strings":["National Engineering Research Center of Science and Technology Information, Institute of Scientific and Technical Information of China, Beijing, China"],"affiliations":[{"raw_affiliation_string":"National Engineering Research Center of Science and Technology Information, Institute of Scientific and Technical Information of China, Beijing, China","institution_ids":["https://openalex.org/I4210104311"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5101419444"],"corresponding_institution_ids":["https://openalex.org/I4210104311"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.1326,"has_fulltext":true,"cited_by_count":4,"citation_normalized_percentile":{"value":0.56849268,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"8","issue":null,"first_page":"223156","last_page":"223171"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.7280457019805908},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7062281966209412},{"id":"https://openalex.org/keywords/autoencoder","display_name":"Autoencoder","score":0.6614386439323425},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6107192039489746},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.6095457077026367},{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.5823404788970947},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.5703874230384827},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5661895275115967},{"id":"https://openalex.org/keywords/dimensionality-reduction","display_name":"Dimensionality reduction","score":0.5241725444793701},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.4671957492828369},{"id":"https://openalex.org/keywords/random-forest","display_name":"Random forest","score":0.4442245364189148},{"id":"https://openalex.org/keywords/regularization","display_name":"Regularization (linguistics)","score":0.42826586961746216},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.3115062117576599}],"concepts":[{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.7280457019805908},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7062281966209412},{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.6614386439323425},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6107192039489746},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.6095457077026367},{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.5823404788970947},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.5703874230384827},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5661895275115967},{"id":"https://openalex.org/C70518039","wikidata":"https://www.wikidata.org/wiki/Q16000077","display_name":"Dimensionality reduction","level":2,"score":0.5241725444793701},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.4671957492828369},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.4442245364189148},{"id":"https://openalex.org/C2776135515","wikidata":"https://www.wikidata.org/wiki/Q17143721","display_name":"Regularization (linguistics)","level":2,"score":0.42826586961746216},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.3115062117576599}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2020.3042778","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.3042778","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/09284562.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:3c1104285e7e4e50b16da8d79aa22d84","is_oa":true,"landing_page_url":"https://doaj.org/article/3c1104285e7e4e50b16da8d79aa22d84","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 8, Pp 223156-223171 (2020)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2020.3042778","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.3042778","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/09284562.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.7300000190734863,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[{"id":"https://openalex.org/G1951943845","display_name":null,"funder_award_id":"2019M650804","funder_id":"https://openalex.org/F4320321543","funder_display_name":"China Postdoctoral Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320321543","display_name":"China Postdoctoral Science Foundation","ror":"https://ror.org/0426zh255"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3112256745.pdf","grobid_xml":"https://content.openalex.org/works/W3112256745.grobid-xml"},"referenced_works_count":66,"referenced_works":["https://openalex.org/W1491611863","https://openalex.org/W1880262756","https://openalex.org/W1965129197","https://openalex.org/W1970544520","https://openalex.org/W1977830790","https://openalex.org/W2001141328","https://openalex.org/W2042970394","https://openalex.org/W2048195127","https://openalex.org/W2053186076","https://openalex.org/W2072128103","https://openalex.org/W2088314245","https://openalex.org/W2100002341","https://openalex.org/W2107743791","https://openalex.org/W2110798204","https://openalex.org/W2112104211","https://openalex.org/W2140793251","https://openalex.org/W2141923507","https://openalex.org/W2145094598","https://openalex.org/W2153579005","https://openalex.org/W2156718197","https://openalex.org/W2157006255","https://openalex.org/W2163922914","https://openalex.org/W2168084958","https://openalex.org/W2171836785","https://openalex.org/W2187089797","https://openalex.org/W2218318129","https://openalex.org/W2252108544","https://openalex.org/W2267186426","https://openalex.org/W2288498609","https://openalex.org/W2462891382","https://openalex.org/W2507868973","https://openalex.org/W2516537890","https://openalex.org/W2575152338","https://openalex.org/W2576754561","https://openalex.org/W2586593666","https://openalex.org/W2741271950","https://openalex.org/W2777205766","https://openalex.org/W2884287800","https://openalex.org/W2887928931","https://openalex.org/W2913757497","https://openalex.org/W2963403868","https://openalex.org/W2969519670","https://openalex.org/W2969521304","https://openalex.org/W2971279492","https://openalex.org/W2991696912","https://openalex.org/W2995824694","https://openalex.org/W2997574889","https://openalex.org/W3005792683","https://openalex.org/W3011170682","https://openalex.org/W3035913193","https://openalex.org/W4231109964","https://openalex.org/W4231510805","https://openalex.org/W4233135949","https://openalex.org/W4294170691","https://openalex.org/W4385245566","https://openalex.org/W6629486361","https://openalex.org/W6639619044","https://openalex.org/W6674813771","https://openalex.org/W6676481782","https://openalex.org/W6680757391","https://openalex.org/W6681096077","https://openalex.org/W6682691769","https://openalex.org/W6682755970","https://openalex.org/W6683240801","https://openalex.org/W6688386640","https://openalex.org/W6739901393"],"related_works":["https://openalex.org/W4310873165","https://openalex.org/W2355395139","https://openalex.org/W2120164251","https://openalex.org/W4285596704","https://openalex.org/W2983142544","https://openalex.org/W2891059443","https://openalex.org/W4281663961","https://openalex.org/W3208888551","https://openalex.org/W4313561566","https://openalex.org/W3208386644"],"abstract_inverted_index":{"Shortness":[0],"and":[1,10,38,117,154,189,223],"sparsity":[2],"often":[3],"plague":[4],"short":[5,22,55,68,103,201,220],"text":[6,23,56,104,202,221],"representation":[7,24],"for":[8,165,192],"clustering":[9,222],"classification.":[11,224],"A":[12],"popular":[13],"solution":[14],"is":[15],"to":[16,62,85,99,178,185,233],"extract":[17,100],"meaningful":[18],"low-dimensional":[19,42,102,238],"embeddings":[20,43,135,193],"as":[21,35,147,184],"via":[25,111],"various":[26],"Dimensionality":[27],"Reduction":[28],"technology.":[29],"However,":[30],"the":[31,45,51,87,90,120,129,143,159,163,166,180,204,211,217,235],"existing":[32],"methods,":[33],"such":[34],"topic":[36],"models":[37],"neural":[39],"networks,":[40],"discover":[41],"from":[44,89],"whole":[46],"training":[47,95,139,167],"sets":[48],"without":[49],"considering":[50],"geometrical":[52,122],"information":[53],"of":[54,67,96,128,132,140,162,174,219,237],"manifold,":[57],"resulting":[58],"in":[59],"an":[60,112],"inability":[61],"provide":[63],"a":[64,75,93,126,137,148,171],"discriminative":[65,101,213],"embedding":[66],"text.":[69],"In":[70],"this":[71],"paper,":[72],"we":[73],"propose":[74],"manifold-regularized":[76],"method,":[77],"namely":[78],"Short":[79],"Texts":[80],"Embedding":[81],"AutoEncoders":[82,97],"(STE-AEs),":[83],"aiming":[84],"incorporate":[86],"semantics":[88,109],"neighborhood":[91,110],"into":[92,136],"regularization":[94,138],"(AEs)":[98],"embeddings.":[105,155,239],"STE-AEs":[106,169,208],"first":[107],"determines":[108],"attention-based":[113],"weighted":[114,130],"matching":[115],"distance":[116],"then":[118],"preserves":[119],"local":[121],"structure":[123],"by":[124],"incorporating":[125],"minimization":[127],"cross-entropy":[131],"nearby":[133],"texts'":[134],"AEs.":[141],"Finally,":[142],"encoder":[144,164],"can":[145,209,229],"act":[146],"parametrized":[149],"mapping":[150],"function":[151],"between":[152],"observations":[153],"Furthermore,":[156],"based":[157],"on":[158,198],"activation":[160],"values":[161],"set,":[168],"employs":[170],"regression":[172],"model":[173],"Random":[175],"Forest":[176],"(RF)":[177],"determine":[179],"feature":[181],"importance":[182],"so":[183],"find":[186],"certain":[187],"informative":[188],"readable":[190],"words":[191,228],"interpretation.":[194],"Through":[195],"extensive":[196],"experiments":[197],"three":[199],"real-world":[200],"corpuses,":[203],"evidence":[205],"demonstrate":[206],"that":[207],"capture":[210],"intrinsic":[212],"explanatory":[214],"factors,":[215],"improving":[216],"performance":[218],"Moreover,":[225],"some":[226],"understandable":[227],"be":[230],"efficiently":[231],"discovered":[232],"promote":[234],"interpretability":[236]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
