{"id":"https://openalex.org/W4391331168","doi":"https://doi.org/10.1109/smc53992.2023.10394665","title":"A Quantitative Analysis of Noise Impact on Document Ranking","display_name":"A Quantitative Analysis of Noise Impact on Document Ranking","publication_year":2023,"publication_date":"2023-10-01","ids":{"openalex":"https://openalex.org/W4391331168","doi":"https://doi.org/10.1109/smc53992.2023.10394665"},"language":"en","primary_location":{"id":"doi:10.1109/smc53992.2023.10394665","is_oa":false,"landing_page_url":"https://doi.org/10.1109/smc53992.2023.10394665","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Conference on Systems, Man, and Cybernetics (SMC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://hal.science/hal-04284004/document","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5031075054","display_name":"Edward Giamphy","orcid":null},"institutions":[{"id":"https://openalex.org/I4210115909","display_name":"Mutuelle G\u00e9n\u00e9rale de l'\u00c9ducation Nationale","ror":"https://ror.org/029vj4k86","country_code":"FR","type":"nonprofit","lineage":["https://openalex.org/I4210115909"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Edward Giamphy","raw_affiliation_strings":["Preligens and L3i,Paris,FRANCE","Preligens and L3i, Paris, FRANCE"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Preligens and L3i,Paris,FRANCE","institution_ids":["https://openalex.org/I4210115909"]},{"raw_affiliation_string":"Preligens and L3i, Paris, FRANCE","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070059933","display_name":"Kevin Sanchis","orcid":null},"institutions":[{"id":"https://openalex.org/I4210115909","display_name":"Mutuelle G\u00e9n\u00e9rale de l'\u00c9ducation Nationale","ror":"https://ror.org/029vj4k86","country_code":"FR","type":"nonprofit","lineage":["https://openalex.org/I4210115909"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Kevin Sanchis","raw_affiliation_strings":["Preligens,Paris,FRANCE","Preligens, Paris, FRANCE"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Preligens,Paris,FRANCE","institution_ids":["https://openalex.org/I4210115909"]},{"raw_affiliation_string":"Preligens, Paris, FRANCE","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035793542","display_name":"Gohar Dashyan","orcid":null},"institutions":[{"id":"https://openalex.org/I4210115909","display_name":"Mutuelle G\u00e9n\u00e9rale de l'\u00c9ducation Nationale","ror":"https://ror.org/029vj4k86","country_code":"FR","type":"nonprofit","lineage":["https://openalex.org/I4210115909"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Gohar Dashyan","raw_affiliation_strings":["Preligens,Paris,FRANCE","Preligens, Paris, FRANCE"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Preligens,Paris,FRANCE","institution_ids":["https://openalex.org/I4210115909"]},{"raw_affiliation_string":"Preligens, Paris, FRANCE","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046943453","display_name":"Jean\u2010Loup Guillaume","orcid":"https://orcid.org/0000-0002-4615-1563"},"institutions":[{"id":"https://openalex.org/I78744979","display_name":"La Rochelle Universit\u00e9","ror":"https://ror.org/04mv1z119","country_code":"FR","type":"education","lineage":["https://openalex.org/I78744979"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Jean-Loup Guillaume","raw_affiliation_strings":["La Rochelle University,L3i,La Rochelle,FRANCE","L3i, La Rochelle University, La Rochelle, FRANCE"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"La Rochelle University,L3i,La Rochelle,FRANCE","institution_ids":["https://openalex.org/I78744979"]},{"raw_affiliation_string":"L3i, La Rochelle University, La Rochelle, FRANCE","institution_ids":["https://openalex.org/I78744979"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046944392","display_name":"Ahmed Hamdi","orcid":"https://orcid.org/0000-0002-8964-2135"},"institutions":[{"id":"https://openalex.org/I78744979","display_name":"La Rochelle Universit\u00e9","ror":"https://ror.org/04mv1z119","country_code":"FR","type":"education","lineage":["https://openalex.org/I78744979"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Ahmed Hamdi","raw_affiliation_strings":["La Rochelle University,L3i,La Rochelle,FRANCE","L3i, La Rochelle University, La Rochelle, FRANCE"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"La Rochelle University,L3i,La Rochelle,FRANCE","institution_ids":["https://openalex.org/I78744979"]},{"raw_affiliation_string":"L3i, La Rochelle University, La Rochelle, FRANCE","institution_ids":["https://openalex.org/I78744979"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050260555","display_name":"Lilian Sanselme","orcid":null},"institutions":[{"id":"https://openalex.org/I4210115909","display_name":"Mutuelle G\u00e9n\u00e9rale de l'\u00c9ducation Nationale","ror":"https://ror.org/029vj4k86","country_code":"FR","type":"nonprofit","lineage":["https://openalex.org/I4210115909"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Lilian Sanselme","raw_affiliation_strings":["Preligens,Paris,FRANCE","Preligens, Paris, FRANCE"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Preligens,Paris,FRANCE","institution_ids":["https://openalex.org/I4210115909"]},{"raw_affiliation_string":"Preligens, Paris, FRANCE","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5033491986","display_name":"Antoine Doucet","orcid":"https://orcid.org/0000-0001-6160-3356"},"institutions":[{"id":"https://openalex.org/I78744979","display_name":"La Rochelle Universit\u00e9","ror":"https://ror.org/04mv1z119","country_code":"FR","type":"education","lineage":["https://openalex.org/I78744979"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Antoine Doucet","raw_affiliation_strings":["La Rochelle University,L3i,La Rochelle,FRANCE","L3i, La Rochelle University, La Rochelle, FRANCE"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"La Rochelle University,L3i,La Rochelle,FRANCE","institution_ids":["https://openalex.org/I78744979"]},{"raw_affiliation_string":"L3i, La Rochelle University, La Rochelle, FRANCE","institution_ids":["https://openalex.org/I78744979"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.8158,"has_fulltext":true,"cited_by_count":5,"citation_normalized_percentile":{"value":0.7926329,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"4612","last_page":"4618"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9952999949455261,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9952999949455261,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9950000047683716,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9943000078201294,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.8400897979736328},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8012259602546692},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.7332739233970642},{"id":"https://openalex.org/keywords/digitization","display_name":"Digitization","score":0.6255118250846863},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.6071908473968506},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5297252535820007},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.5088339447975159},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5009779930114746},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4284176528453827},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.42046457529067993},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3578495383262634},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.08843433856964111},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.08423033356666565}],"concepts":[{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.8400897979736328},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8012259602546692},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.7332739233970642},{"id":"https://openalex.org/C2779308522","wikidata":"https://www.wikidata.org/wiki/Q843958","display_name":"Digitization","level":2,"score":0.6255118250846863},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.6071908473968506},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5297252535820007},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.5088339447975159},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5009779930114746},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4284176528453827},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.42046457529067993},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3578495383262634},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.08843433856964111},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.08423033356666565},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/smc53992.2023.10394665","is_oa":false,"landing_page_url":"https://doi.org/10.1109/smc53992.2023.10394665","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Conference on Systems, Man, and Cybernetics (SMC)","raw_type":"proceedings-article"},{"id":"pmh:oai:HAL:hal-04284004v1","is_oa":true,"landing_page_url":"https://hal.science/hal-04284004","pdf_url":"https://hal.science/hal-04284004/document","source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Conference on Systems, Man, and Cybernetics, Oct 2023, Honolulu, United States. pp.4612-4618, &#x27E8;10.1109/SMC53992.2023.10394665&#x27E9;","raw_type":"Conference papers"}],"best_oa_location":{"id":"pmh:oai:HAL:hal-04284004v1","is_oa":true,"landing_page_url":"https://hal.science/hal-04284004","pdf_url":"https://hal.science/hal-04284004/document","source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Conference on Systems, Man, and Cybernetics, Oct 2023, Honolulu, United States. pp.4612-4618, &#x27E8;10.1109/SMC53992.2023.10394665&#x27E9;","raw_type":"Conference papers"},"sustainable_development_goals":[{"score":0.6100000143051147,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4391331168.pdf"},"referenced_works_count":35,"referenced_works":["https://openalex.org/W745540356","https://openalex.org/W1523019309","https://openalex.org/W1541376310","https://openalex.org/W1573345323","https://openalex.org/W1821462560","https://openalex.org/W1976978162","https://openalex.org/W1977053705","https://openalex.org/W2043909051","https://openalex.org/W2044830896","https://openalex.org/W2069870183","https://openalex.org/W2212003014","https://openalex.org/W2500799460","https://openalex.org/W2896457183","https://openalex.org/W2900753330","https://openalex.org/W2945260553","https://openalex.org/W2951534261","https://openalex.org/W2978017171","https://openalex.org/W2982632725","https://openalex.org/W3012289950","https://openalex.org/W3015310959","https://openalex.org/W3049158684","https://openalex.org/W3098319558","https://openalex.org/W3155375847","https://openalex.org/W3180230246","https://openalex.org/W3202377836","https://openalex.org/W3213851456","https://openalex.org/W4205848394","https://openalex.org/W4213009331","https://openalex.org/W4221050583","https://openalex.org/W4230543443","https://openalex.org/W4288089799","https://openalex.org/W4318196853","https://openalex.org/W4320732451","https://openalex.org/W6621929542","https://openalex.org/W6632372736"],"related_works":["https://openalex.org/W1539704186","https://openalex.org/W4254109238","https://openalex.org/W2399890175","https://openalex.org/W4308177873","https://openalex.org/W3202479762","https://openalex.org/W2480493049","https://openalex.org/W2592115649","https://openalex.org/W4322582183","https://openalex.org/W1937392525","https://openalex.org/W2347632764"],"abstract_inverted_index":{"After":[0],"decades":[1],"of":[2,8,16,25,29,71,74,98,101,117,120,132,141],"massive":[3],"digitization,":[4],"a":[5,69,93,118],"sub-stantial":[6],"amount":[7],"documents":[9,18,31],"exists":[10],"in":[11,34,57,82],"digital":[12],"form.":[13],"The":[14,41],"accessibility":[15],"these":[17,30],"is":[19],"strongly":[20],"impacted":[21],"by":[22,107],"the":[23,72,99,121,139],"quality":[24],"document":[26,77,105,142],"indexing.":[27],"Most":[28],"are":[32,154],"indexed":[33],"noisy":[35,115,145],"versions":[36,116],"that":[37,153],"include":[38],"numerous":[39],"errors.":[40],"noise":[42,75],"can":[43],"be":[44],"due":[45],"to":[46,157],"manual":[47],"input":[48],"mistakes":[49],"or":[50],"optical":[51],"character":[52],"recognition":[53,102],"process":[54],"and":[55,64,95,130,147],"results":[56],"errors":[58,103],"like":[59],"spelling":[60],"mistakes,":[61],"missing":[62],"characters,":[63],"others.":[65],"This":[66],"paper":[67],"presents":[68],"study":[70,135],"impact":[73,100],"on":[76,104,113],"ranking,":[78],"an":[79],"essential":[80],"task":[81],"natural":[83],"language":[84],"processing":[85],"(NLP)":[86],"with":[87,127],"wide-ranging":[88],"practical":[89],"applications.":[90],"We":[91],"provide":[92],"deep":[94],"quantitative":[96],"analysis":[97],"ranking":[106,111,125,143,151],"testing":[108],"two":[109],"popular":[110],"models":[112,152],"several":[114],"subset":[119],"MS":[122],"MARCO":[123],"passage":[124],"dataset,":[126],"various":[128],"levels":[129],"types":[131],"noise.":[133,158],"Our":[134],"provides":[136],"insights":[137],"into":[138],"challenges":[140],"under":[144],"conditions":[146],"advocates":[148],"for":[149],"developing":[150],"more":[155],"robust":[156]},"counts_by_year":[{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
