{"id":"https://openalex.org/W2802763641","doi":"https://doi.org/10.1145/3169795","title":"Duplicate Detection in Programming Question Answering Communities","display_name":"Duplicate Detection in Programming Question Answering Communities","publication_year":2018,"publication_date":"2018-04-17","ids":{"openalex":"https://openalex.org/W2802763641","doi":"https://doi.org/10.1145/3169795","mag":"2802763641"},"language":"en","primary_location":{"id":"doi:10.1145/3169795","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3169795","pdf_url":null,"source":{"id":"https://openalex.org/S97833917","display_name":"ACM Transactions on Internet Technology","issn_l":"1533-5399","issn":["1533-5399","1557-6051"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Internet Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5070697660","display_name":"Wei Emma Zhang","orcid":"https://orcid.org/0000-0002-0406-5974"},"institutions":[{"id":"https://openalex.org/I99043593","display_name":"Macquarie University","ror":"https://ror.org/01sf06y89","country_code":"AU","type":"education","lineage":["https://openalex.org/I99043593"]}],"countries":["AU"],"is_corresponding":true,"raw_author_name":"Wei Emma Zhang","raw_affiliation_strings":["Macquarie University, Australia"],"affiliations":[{"raw_affiliation_string":"Macquarie University, Australia","institution_ids":["https://openalex.org/I99043593"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080744092","display_name":"Quan Z. Sheng","orcid":"https://orcid.org/0000-0002-3326-4147"},"institutions":[{"id":"https://openalex.org/I99043593","display_name":"Macquarie University","ror":"https://ror.org/01sf06y89","country_code":"AU","type":"education","lineage":["https://openalex.org/I99043593"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Quan Z. Sheng","raw_affiliation_strings":["Macquarie University, Australia"],"affiliations":[{"raw_affiliation_string":"Macquarie University, Australia","institution_ids":["https://openalex.org/I99043593"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032767467","display_name":"Jey Han Lau","orcid":"https://orcid.org/0000-0002-1647-4628"},"institutions":[{"id":"https://openalex.org/I4210120068","display_name":"IBM Research - Australia","ror":"https://ror.org/027r3nx49","country_code":"AU","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115","https://openalex.org/I4210120068"]},{"id":"https://openalex.org/I165779595","display_name":"University of Melbourne","ror":"https://ror.org/01ej9dk98","country_code":"AU","type":"education","lineage":["https://openalex.org/I165779595"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Jey Han Lau","raw_affiliation_strings":["The University of Melbourne and IBM Research Australia, Australia"],"affiliations":[{"raw_affiliation_string":"The University of Melbourne and IBM Research Australia, Australia","institution_ids":["https://openalex.org/I4210120068","https://openalex.org/I165779595"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005140412","display_name":"Ermyas Abebe","orcid":null},"institutions":[{"id":"https://openalex.org/I4210120068","display_name":"IBM Research - Australia","ror":"https://ror.org/027r3nx49","country_code":"AU","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115","https://openalex.org/I4210120068"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Ermyas Abebe","raw_affiliation_strings":["IBM Research Australia, Australia"],"affiliations":[{"raw_affiliation_string":"IBM Research Australia, Australia","institution_ids":["https://openalex.org/I4210120068"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5074225885","display_name":"Wenjie Ruan","orcid":"https://orcid.org/0000-0002-8311-8738"},"institutions":[{"id":"https://openalex.org/I40120149","display_name":"University of Oxford","ror":"https://ror.org/052gg0110","country_code":"GB","type":"education","lineage":["https://openalex.org/I40120149"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Wenjie Ruan","raw_affiliation_strings":["University of Oxford, Oxford, UK"],"affiliations":[{"raw_affiliation_string":"University of Oxford, Oxford, UK","institution_ids":["https://openalex.org/I40120149"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5070697660"],"corresponding_institution_ids":["https://openalex.org/I99043593"],"apc_list":null,"apc_paid":null,"fwci":2.1175,"has_fulltext":false,"cited_by_count":20,"citation_normalized_percentile":{"value":0.90097077,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"18","issue":"3","first_page":"1","last_page":"21"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13274","display_name":"Expert finding and Q&A systems","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.9883000254631042,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8683341145515442},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.6858826875686646},{"id":"https://openalex.org/keywords/question-answering","display_name":"Question answering","score":0.6822413802146912},{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.640186071395874},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5720124840736389},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.5413411259651184},{"id":"https://openalex.org/keywords/learning-to-rank","display_name":"Learning to rank","score":0.5025515556335449},{"id":"https://openalex.org/keywords/rank","display_name":"Rank (graph theory)","score":0.4696003198623657},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.4695473313331604},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.37918710708618164},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3372838795185089},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.1384543776512146}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8683341145515442},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.6858826875686646},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.6822413802146912},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.640186071395874},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5720124840736389},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.5413411259651184},{"id":"https://openalex.org/C86037889","wikidata":"https://www.wikidata.org/wiki/Q4330127","display_name":"Learning to rank","level":3,"score":0.5025515556335449},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.4696003198623657},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.4695473313331604},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.37918710708618164},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3372838795185089},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.1384543776512146},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3169795","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3169795","pdf_url":null,"source":{"id":"https://openalex.org/S97833917","display_name":"ACM Transactions on Internet Technology","issn_l":"1533-5399","issn":["1533-5399","1557-6051"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Internet Technology","raw_type":"journal-article"},{"id":"pmh:oai:digital.library.adelaide.edu.au:2440/121076","is_oa":false,"landing_page_url":"http://hdl.handle.net/2440/121076","pdf_url":null,"source":{"id":"https://openalex.org/S4306401835","display_name":"Adelaide Research & Scholarship (AR&S) (University of Adelaide)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I5681781","host_organization_name":"The University of Adelaide","host_organization_lineage":["https://openalex.org/I5681781"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://dx.doi.org/10.1145/3169795","raw_type":"Journal article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.8299999833106995,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":48,"referenced_works":["https://openalex.org/W1482214997","https://openalex.org/W1493309689","https://openalex.org/W1566018662","https://openalex.org/W1597533204","https://openalex.org/W1880262756","https://openalex.org/W1972594981","https://openalex.org/W1975809876","https://openalex.org/W1980095184","https://openalex.org/W1985258161","https://openalex.org/W1988790447","https://openalex.org/W1999822363","https://openalex.org/W2008056655","https://openalex.org/W2008652694","https://openalex.org/W2035363410","https://openalex.org/W2038721957","https://openalex.org/W2060758175","https://openalex.org/W2086530517","https://openalex.org/W2091825929","https://openalex.org/W2093219119","https://openalex.org/W2103305545","https://openalex.org/W2105157020","https://openalex.org/W2113242816","https://openalex.org/W2118978333","https://openalex.org/W2119168550","https://openalex.org/W2120284981","https://openalex.org/W2123246351","https://openalex.org/W2124940540","https://openalex.org/W2131744502","https://openalex.org/W2151280665","https://openalex.org/W2153579005","https://openalex.org/W2156985047","https://openalex.org/W2160218441","https://openalex.org/W2239327973","https://openalex.org/W2250225488","https://openalex.org/W2250565861","https://openalex.org/W2251427843","https://openalex.org/W2252136820","https://openalex.org/W2282146481","https://openalex.org/W2293877768","https://openalex.org/W2340381866","https://openalex.org/W2401290433","https://openalex.org/W2477400917","https://openalex.org/W2604420197","https://openalex.org/W2950133940","https://openalex.org/W2963514026","https://openalex.org/W3009009611","https://openalex.org/W3085162807","https://openalex.org/W4238530616"],"related_works":["https://openalex.org/W3127142483","https://openalex.org/W3160516639","https://openalex.org/W4385565564","https://openalex.org/W2898073868","https://openalex.org/W2138488530","https://openalex.org/W2971071571","https://openalex.org/W2798835721","https://openalex.org/W2922169395","https://openalex.org/W2387658907","https://openalex.org/W2385796165"],"abstract_inverted_index":{"Community-based":[0],"Question":[1],"Answering":[2],"(CQA)":[3],"websites":[4,23],"are":[5,25],"attracting":[6],"increasing":[7],"numbers":[8],"of":[9,61,81,111,118],"users":[10],"and":[11,24,102,158,184,195],"contributors":[12],"in":[13,21,75,192,214],"recent":[14],"years.":[15],"However,":[16],"duplicate":[17,33,130],"questions":[18,120,148,202],"frequently":[19],"occur":[20],"CQA":[22,77,82],"currently":[26],"manually":[27],"identified":[28],"by":[29],"the":[30,50,91,99,109,141,146,154,160,168,172,223],"moderators.":[31],"Automatic":[32],"detection,":[34],"on":[35,49,98,104,187,200],"one":[36],"hand,":[37,52],"alleviates":[38],"this":[39],"laborious":[40],"effort":[41],"for":[42],"moderators":[43],"before":[44],"taking":[45],"close":[46],"actions,":[47],"and,":[48],"other":[51],"helps":[53],"question":[54,100,138,157,188],"issuers":[55],"quickly":[56],"find":[57],"answers.":[58],"A":[59],"number":[60],"studies":[62],"have":[63],"looked":[64],"into":[65],"related":[66],"problems,":[67],"but":[68],"very":[69,212],"limited":[70],"works":[71,89,211],"target":[72],"Duplicate":[73],"Detection":[74],"Programming":[76],"(PCQA),":[78],"a":[79,94,133],"branch":[80],"that":[83,179,208],"is":[84,121],"dedicated":[85],"to":[86,150,153,166,218,222],"programmers.":[87],"Existing":[88],"framed":[90],"task":[92],"as":[93,132,164],"supervised":[95],"learning":[96,194],"problem":[97,136],"pairs":[101],"relied":[103],"only":[105],"textual":[106,182],"features.":[107],"Moreover,":[108],"issue":[110],"selecting":[112],"candidate":[113],"duplicates":[114],"from":[115],"large":[116],"volumes":[117],"historical":[119,147],"often":[122],"un-addressed.":[123],"To":[124],"tackle":[125],"these":[126],"issues,":[127],"we":[128,144,175],"model":[129],"detection":[131],"two-stage":[134],"\u201cranking-classification\u201d":[135],"over":[137],"pairs.":[139],"In":[140,171],"first":[142],"stage,":[143,174],"rank":[145],"according":[149],"their":[151],"similarities":[152],"newly":[155],"issued":[156],"select":[159],"top":[161],"ranked":[162],"ones":[163],"candidates":[165],"reduce":[167],"search":[169],"space.":[170],"second":[173],"develop":[176],"novel":[177],"features":[178],"capture":[180],"both":[181],"similarity":[183],"latent":[185],"semantics":[186],"pairs,":[189],"leveraging":[190],"techniques":[191],"deep":[193],"information":[196],"retrieval":[197],"literature.":[198],"Experiments":[199],"real-world":[201],"about":[203],"multiple":[204],"programming":[205],"languages":[206],"demonstrate":[207],"our":[209],"method":[210],"well;":[213],"some":[215],"cases,":[216],"up":[217],"25%":[219],"improvement":[220],"compared":[221],"state-of-the-art":[224],"benchmarks.":[225]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":9},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
