{"id":"https://openalex.org/W4387608567","doi":"https://doi.org/10.15439/2023f7569","title":"Improving Domain-Specific Retrieval by NLI Fine-Tuning","display_name":"Improving Domain-Specific Retrieval by NLI Fine-Tuning","publication_year":2023,"publication_date":"2023-09-26","ids":{"openalex":"https://openalex.org/W4387608567","doi":"https://doi.org/10.15439/2023f7569"},"language":"en","primary_location":{"id":"doi:10.15439/2023f7569","is_oa":true,"landing_page_url":"http://dx.doi.org/10.15439/2023f7569","pdf_url":"https://annals-csis.org/proceedings/2023/drp/pdf/7569.pdf","source":{"id":"https://openalex.org/S4220651875","display_name":"Annals of Computer Science and Information Systems","issn_l":"2300-5963","issn":["2300-5963"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":"https://openalex.org/P4310317484","host_organization_name":"Polskie Towarzystwo Informatyczne","host_organization_lineage":["https://openalex.org/P4310317484"],"host_organization_lineage_names":["Polskie Towarzystwo Informatyczne"],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Annals of Computer Science and Information Systems","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://annals-csis.org/proceedings/2023/drp/pdf/7569.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5092616533","display_name":"Roman Du\u0161ek","orcid":"https://orcid.org/0009-0009-6388-9488"},"institutions":[{"id":"https://openalex.org/I99542240","display_name":"Polish Academy of Sciences","ror":"https://ror.org/01dr6c206","country_code":"PL","type":"government","lineage":["https://openalex.org/I99542240"]}],"countries":["PL"],"is_corresponding":true,"raw_author_name":"Roman Dusek","raw_affiliation_strings":["Allegro sp. z o.o. Wierzbi\u0119cice 1B, 61-569 Pozna\u0144, Poland","Institue of Compter Science, Polish Academy of Sciences Jana Kazimierza 5, 01-248 Warszawa"],"affiliations":[{"raw_affiliation_string":"Allegro sp. z o.o. Wierzbi\u0119cice 1B, 61-569 Pozna\u0144, Poland","institution_ids":[]},{"raw_affiliation_string":"Institue of Compter Science, Polish Academy of Sciences Jana Kazimierza 5, 01-248 Warszawa","institution_ids":["https://openalex.org/I99542240"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000658598","display_name":"Aleksander Wawer","orcid":"https://orcid.org/0000-0002-7081-9797"},"institutions":[{"id":"https://openalex.org/I99542240","display_name":"Polish Academy of Sciences","ror":"https://ror.org/01dr6c206","country_code":"PL","type":"government","lineage":["https://openalex.org/I99542240"]}],"countries":["PL"],"is_corresponding":false,"raw_author_name":"Aleksander Wawer","raw_affiliation_strings":["Allegro sp. z o.o. Wierzbi\u0119cice 1B, 61-569 Pozna\u0144, Poland","Institue of Compter Science, Polish Academy of Sciences Jana Kazimierza 5, 01-248 Warszawa"],"affiliations":[{"raw_affiliation_string":"Allegro sp. z o.o. Wierzbi\u0119cice 1B, 61-569 Pozna\u0144, Poland","institution_ids":[]},{"raw_affiliation_string":"Institue of Compter Science, Polish Academy of Sciences Jana Kazimierza 5, 01-248 Warszawa","institution_ids":["https://openalex.org/I99542240"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029928593","display_name":"Christopher Galias","orcid":null},"institutions":[{"id":"https://openalex.org/I99542240","display_name":"Polish Academy of Sciences","ror":"https://ror.org/01dr6c206","country_code":"PL","type":"government","lineage":["https://openalex.org/I99542240"]}],"countries":["PL"],"is_corresponding":false,"raw_author_name":"Christopher Galias","raw_affiliation_strings":["Allegro sp. z o.o. Wierzbi\u0119cice 1B, 61-569 Pozna\u0144, Poland","Institue of Compter Science, Polish Academy of Sciences Jana Kazimierza 5, 01-248 Warszawa"],"affiliations":[{"raw_affiliation_string":"Allegro sp. z o.o. Wierzbi\u0119cice 1B, 61-569 Pozna\u0144, Poland","institution_ids":[]},{"raw_affiliation_string":"Institue of Compter Science, Polish Academy of Sciences Jana Kazimierza 5, 01-248 Warszawa","institution_ids":["https://openalex.org/I99542240"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5092616534","display_name":"Lidia Wojciechowska","orcid":null},"institutions":[{"id":"https://openalex.org/I99542240","display_name":"Polish Academy of Sciences","ror":"https://ror.org/01dr6c206","country_code":"PL","type":"government","lineage":["https://openalex.org/I99542240"]}],"countries":["PL"],"is_corresponding":false,"raw_author_name":"Lidia Wojciechowska","raw_affiliation_strings":["Allegro sp. z o.o. Wierzbi\u0119cice 1B, 61-569 Pozna\u0144, Poland","Institue of Compter Science, Polish Academy of Sciences Jana Kazimierza 5, 01-248 Warszawa"],"affiliations":[{"raw_affiliation_string":"Allegro sp. z o.o. Wierzbi\u0119cice 1B, 61-569 Pozna\u0144, Poland","institution_ids":[]},{"raw_affiliation_string":"Institue of Compter Science, Polish Academy of Sciences Jana Kazimierza 5, 01-248 Warszawa","institution_ids":["https://openalex.org/I99542240"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5092616533"],"corresponding_institution_ids":["https://openalex.org/I99542240"],"apc_list":null,"apc_paid":null,"fwci":0.112,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.30995358,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"35","issue":null,"first_page":"949","last_page":"953"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.8729000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.8729000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.7724000215530396,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.7085999846458435,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6837468147277832},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.5361226797103882},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3705732226371765},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.32866770029067993},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.12115836143493652}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6837468147277832},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.5361226797103882},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3705732226371765},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.32866770029067993},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.12115836143493652},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.15439/2023f7569","is_oa":true,"landing_page_url":"http://dx.doi.org/10.15439/2023f7569","pdf_url":"https://annals-csis.org/proceedings/2023/drp/pdf/7569.pdf","source":{"id":"https://openalex.org/S4220651875","display_name":"Annals of Computer Science and Information Systems","issn_l":"2300-5963","issn":["2300-5963"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":"https://openalex.org/P4310317484","host_organization_name":"Polskie Towarzystwo Informatyczne","host_organization_lineage":["https://openalex.org/P4310317484"],"host_organization_lineage_names":["Polskie Towarzystwo Informatyczne"],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Annals of Computer Science and Information Systems","raw_type":"proceedings-article"},{"id":"pmh:oai:doaj.org/article:49b2621af191495899e52a59da2a0000","is_oa":true,"landing_page_url":"https://doaj.org/article/49b2621af191495899e52a59da2a0000","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Annals of computer science and information systems, Vol 35, Pp 949-953 (2023)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.15439/2023f7569","is_oa":true,"landing_page_url":"http://dx.doi.org/10.15439/2023f7569","pdf_url":"https://annals-csis.org/proceedings/2023/drp/pdf/7569.pdf","source":{"id":"https://openalex.org/S4220651875","display_name":"Annals of Computer Science and Information Systems","issn_l":"2300-5963","issn":["2300-5963"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":"https://openalex.org/P4310317484","host_organization_name":"Polskie Towarzystwo Informatyczne","host_organization_lineage":["https://openalex.org/P4310317484"],"host_organization_lineage_names":["Polskie Towarzystwo Informatyczne"],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Annals of Computer Science and Information Systems","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4387608567.pdf","grobid_xml":"https://content.openalex.org/works/W4387608567.grobid-xml"},"referenced_works_count":27,"referenced_works":["https://openalex.org/W1840435438","https://openalex.org/W2739744877","https://openalex.org/W2896457183","https://openalex.org/W2961915345","https://openalex.org/W2982153178","https://openalex.org/W2983040767","https://openalex.org/W2998702515","https://openalex.org/W3021457404","https://openalex.org/W3027758526","https://openalex.org/W3035390927","https://openalex.org/W3035614045","https://openalex.org/W3038033387","https://openalex.org/W3093681740","https://openalex.org/W3099977667","https://openalex.org/W3105214104","https://openalex.org/W3118062200","https://openalex.org/W3155292524","https://openalex.org/W3156636935","https://openalex.org/W3157789198","https://openalex.org/W4220818323","https://openalex.org/W4225565720","https://openalex.org/W4283702870","https://openalex.org/W6734897383","https://openalex.org/W6769444473","https://openalex.org/W6777048723","https://openalex.org/W6783561170","https://openalex.org/W7054915730"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W2382290278","https://openalex.org/W2350741829","https://openalex.org/W2530322880","https://openalex.org/W1596801655","https://openalex.org/W2359140296"],"abstract_inverted_index":{"The":[0],"aim":[1],"of":[2,11,35,74,96,103],"this":[3,24],"article":[4],"is":[5],"to":[6,17,65,86,99],"investigate":[7,92],"the":[8,36,66,72,75,84,97,101],"finetuning":[9],"potential":[10,85],"natural":[12],"language":[13],"inference":[14],"(NLI)":[15],"data":[16,32],"improve":[18,87],"information":[19],"retrieval":[20],"and":[21,28,41,48,60,80,94],"ranking.We":[22],"demonstrate":[23],"for":[25,106],"both":[26,46,78,81],"English":[27],"Polish":[29,38],"languages,":[30,82],"using":[31],"from":[33],"one":[34],"largest":[37],"e-commerce":[39],"sites":[40],"selected":[42],"opendomain":[43],"datasets.We":[44],"employ":[45],"monolingual":[47],"multilingual":[49,89],"sentence":[50],"encoders":[51],"fine-tuned":[52],"by":[53],"a":[54],"supervised":[55],"method":[56],"utilizing":[57],"contrastive":[58],"loss":[59],"NLI":[61,69],"data.Our":[62],"results":[63],"point":[64],"fact":[67],"that":[68],"fine-tuning":[70,105],"increases":[71],"performance":[73],"models":[76],"in":[77],"tasks":[79],"with":[83],"monoand":[88],"models.Finally,":[90],"we":[91],"uniformity":[93],"alignment":[95],"embeddings":[98],"explain":[100],"effect":[102],"NLI-based":[104],"an":[107],"out-of-domain":[108],"use-case.":[109]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-10T14:07:55.174380","created_date":"2025-10-10T00:00:00"}
