{"id":"https://openalex.org/W2121152637","doi":"https://doi.org/10.1145/1088622.1088644","title":"Collecting paraphrase corpora from volunteer contributors","display_name":"Collecting paraphrase corpora from volunteer contributors","publication_year":2005,"publication_date":"2005-10-02","ids":{"openalex":"https://openalex.org/W2121152637","doi":"https://doi.org/10.1145/1088622.1088644","mag":"2121152637"},"language":"en","primary_location":{"id":"doi:10.1145/1088622.1088644","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1088622.1088644","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 3rd international conference on Knowledge capture","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5012269989","display_name":"Timothy Chklovski","orcid":null},"institutions":[{"id":"https://openalex.org/I2801204180","display_name":"Marina Del Rey Hospital","ror":"https://ror.org/05wqyfz02","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I2801204180"]},{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Timothy Chklovski","raw_affiliation_strings":["University of Southern California, Marina del Rey, CA"],"affiliations":[{"raw_affiliation_string":"University of Southern California, Marina del Rey, CA","institution_ids":["https://openalex.org/I2801204180","https://openalex.org/I1174212"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5012269989"],"corresponding_institution_ids":["https://openalex.org/I1174212","https://openalex.org/I2801204180"],"apc_list":null,"apc_paid":null,"fwci":2.7425,"has_fulltext":false,"cited_by_count":39,"citation_normalized_percentile":{"value":0.9124736,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/paraphrase","display_name":"Paraphrase","score":0.9945851564407349},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7824467420578003},{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.6358396410942078},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6347717046737671},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6160972714424133},{"id":"https://openalex.org/keywords/test","display_name":"Test (biology)","score":0.49963927268981934},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.4722428023815155},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.36719053983688354}],"concepts":[{"id":"https://openalex.org/C2780922921","wikidata":"https://www.wikidata.org/wiki/Q255189","display_name":"Paraphrase","level":2,"score":0.9945851564407349},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7824467420578003},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.6358396410942078},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6347717046737671},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6160972714424133},{"id":"https://openalex.org/C2777267654","wikidata":"https://www.wikidata.org/wiki/Q3519023","display_name":"Test (biology)","level":2,"score":0.49963927268981934},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.4722428023815155},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.36719053983688354},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/1088622.1088644","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1088622.1088644","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 3rd international conference on Knowledge capture","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.512.8466","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.512.8466","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.isi.edu/div3/div3/pubs/papers/chklovski2005collecting.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.8199999928474426}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W1507749094","https://openalex.org/W1558641428","https://openalex.org/W1602373044","https://openalex.org/W1980776243","https://openalex.org/W2031071990","https://openalex.org/W2053830012","https://openalex.org/W2085567745","https://openalex.org/W2098217544","https://openalex.org/W2113632140","https://openalex.org/W2118119027","https://openalex.org/W2129468719","https://openalex.org/W2141282920","https://openalex.org/W2162754088","https://openalex.org/W2163022864","https://openalex.org/W6630405400"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2978707643","https://openalex.org/W2294233724","https://openalex.org/W4378713476","https://openalex.org/W4281690070","https://openalex.org/W2169813772","https://openalex.org/W4310803295","https://openalex.org/W2736149021","https://openalex.org/W2398825887","https://openalex.org/W2135591339"],"abstract_inverted_index":{"Extensive":[0],"and":[1,14,35,59,80,100,108,118],"deep":[2],"paraphrase":[3],"corpora":[4],"are":[5],"important":[6],"for":[7],"a":[8],"variety":[9],"of":[10,90,124],"natural":[11],"language":[12],"processing":[13],"user":[15],"interaction":[16],"tasks.":[17],"In":[18],"this":[19],"paper,":[20],"we":[21,71],"present":[22,107],"an":[23,74],"approach":[24,44,94],"which":[25],"i)":[26],"collects":[27],"multiple":[28],"paraphrases":[29,48,55,89],"per":[30],"given":[31],"item":[32],"from":[33,49],"volunteers":[34],"ii)":[36],"incentivises":[37],"responsible":[38],"contributions":[39],"by":[40],"volunteer":[41],"contributors.":[42],"Our":[43],"is":[45],"to":[46,62,83],"solicit":[47],"Web":[50],"volunteers,":[51],"both":[52],"collecting":[53],"new":[54],"with":[56],"no":[57],"prompting":[58],"asking":[60],"contributors":[61],"guess":[63],"partially":[64],"obfuscated":[65],"paraphrases.":[66],"To":[67],"test":[68],"the":[69,122,125],"approach,":[70],"have":[72],"implemented":[73],"online":[75],"game,":[76],"1001":[77],"Paraphrases":[78],"(http://ai-games.org/paraphrase.html),":[79],"deployed":[81],"it":[82],"collect":[84],"20,944":[85],"entries":[86],"focused":[87],"on":[88],"400":[91],"statements.":[92],"The":[93],"complements":[95],"existing":[96],"text":[97],"extraction":[98],"methods":[99],"has":[101],"some":[102],"inherent":[103],"unique":[104],"advantages.":[105],"We":[106],"motivate":[109],"our":[110],"design":[111],"as":[112,114],"well":[113],"share":[115],"preliminary":[116],"observations":[117],"lessons":[119],"learned":[120],"about":[121],"performance":[123],"approach.":[126]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2015,"cited_by_count":2},{"year":2014,"cited_by_count":6},{"year":2013,"cited_by_count":4},{"year":2012,"cited_by_count":6}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
