{"id":"https://openalex.org/W3135677775","doi":"https://doi.org/10.1145/3448139.3448205","title":"Toward Semi-Automatic Misconception Discovery Using Code Embeddings","display_name":"Toward Semi-Automatic Misconception Discovery Using Code Embeddings","publication_year":2021,"publication_date":"2021-04-05","ids":{"openalex":"https://openalex.org/W3135677775","doi":"https://doi.org/10.1145/3448139.3448205","mag":"3135677775"},"language":"en","primary_location":{"id":"doi:10.1145/3448139.3448205","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3448139.3448205","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"LAK21: 11th International Learning Analytics and Knowledge Conference","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2103.04448","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5069526885","display_name":"Yang Shi","orcid":"https://orcid.org/0000-0001-6486-4340"},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Yang Shi","raw_affiliation_strings":["North Carolina State University, United States"],"affiliations":[{"raw_affiliation_string":"North Carolina State University, United States","institution_ids":["https://openalex.org/I137902535"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048962612","display_name":"Krupal Shah","orcid":null},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Krupal Shah","raw_affiliation_strings":["North Carolina State University, United States"],"affiliations":[{"raw_affiliation_string":"North Carolina State University, United States","institution_ids":["https://openalex.org/I137902535"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025684876","display_name":"Wengran Wang","orcid":"https://orcid.org/0009-0006-9364-5474"},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Wengran Wang","raw_affiliation_strings":["North Carolina State University, United States"],"affiliations":[{"raw_affiliation_string":"North Carolina State University, United States","institution_ids":["https://openalex.org/I137902535"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005168403","display_name":"Samiha Marwan","orcid":"https://orcid.org/0000-0001-5283-3395"},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Samiha Marwan","raw_affiliation_strings":["North Carolina State University, United States"],"affiliations":[{"raw_affiliation_string":"North Carolina State University, United States","institution_ids":["https://openalex.org/I137902535"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084543165","display_name":"Poorvaja Penmetsa","orcid":null},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Poorvaja Penmetsa","raw_affiliation_strings":["North Carolina State University, United States"],"affiliations":[{"raw_affiliation_string":"North Carolina State University, United States","institution_ids":["https://openalex.org/I137902535"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5064676990","display_name":"Thomas Price","orcid":"https://orcid.org/0000-0001-9375-2292"},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Thomas Price","raw_affiliation_strings":["North Carolina State University, United States"],"affiliations":[{"raw_affiliation_string":"North Carolina State University, United States","institution_ids":["https://openalex.org/I137902535"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5069526885"],"corresponding_institution_ids":["https://openalex.org/I137902535"],"apc_list":null,"apc_paid":null,"fwci":4.5507,"has_fulltext":false,"cited_by_count":18,"citation_normalized_percentile":{"value":0.94846881,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"606","last_page":"612"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11122","display_name":"Online Learning and Analytics","score":0.9904999732971191,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.9750999808311462,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7969647645950317},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.6250982284545898},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.6232474446296692},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.6077147722244263},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.5264421701431274},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.5058317184448242},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.34060555696487427},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.22190004587173462}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7969647645950317},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.6250982284545898},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.6232474446296692},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.6077147722244263},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.5264421701431274},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.5058317184448242},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.34060555696487427},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.22190004587173462},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3448139.3448205","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3448139.3448205","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"LAK21: 11th International Learning Analytics and Knowledge Conference","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2103.04448","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2103.04448","pdf_url":"https://arxiv.org/pdf/2103.04448","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2103.04448","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2103.04448","pdf_url":"https://arxiv.org/pdf/2103.04448","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.5199999809265137,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320310598","display_name":"Amazon Web Services","ror":"https://ror.org/04mv4n011"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W1521965716","https://openalex.org/W1522301498","https://openalex.org/W1539191223","https://openalex.org/W1598140581","https://openalex.org/W1673310716","https://openalex.org/W1861616335","https://openalex.org/W1991469716","https://openalex.org/W1994532632","https://openalex.org/W1995969371","https://openalex.org/W2074659968","https://openalex.org/W2076771354","https://openalex.org/W2101355109","https://openalex.org/W2108342609","https://openalex.org/W2129740354","https://openalex.org/W2133002245","https://openalex.org/W2153579005","https://openalex.org/W2186498586","https://openalex.org/W2187089797","https://openalex.org/W2247854788","https://openalex.org/W2257123346","https://openalex.org/W2263367457","https://openalex.org/W2275572593","https://openalex.org/W2328992837","https://openalex.org/W2337738304","https://openalex.org/W2413305997","https://openalex.org/W2462557479","https://openalex.org/W2605015267","https://openalex.org/W2605403059","https://openalex.org/W2729115344","https://openalex.org/W2791180937","https://openalex.org/W2806965553","https://openalex.org/W2885048964","https://openalex.org/W2917037155","https://openalex.org/W2951767646","https://openalex.org/W2962995178","https://openalex.org/W2964150020","https://openalex.org/W2964828327","https://openalex.org/W2966643894","https://openalex.org/W4236340759","https://openalex.org/W4294170691"],"related_works":["https://openalex.org/W2081900870","https://openalex.org/W2037549926","https://openalex.org/W2345479200","https://openalex.org/W2183306018","https://openalex.org/W2849310602","https://openalex.org/W3006008237","https://openalex.org/W2419146053","https://openalex.org/W4388890789","https://openalex.org/W2088247287","https://openalex.org/W2963903416"],"abstract_inverted_index":{"Understanding":[0],"students\u2019":[1,58,126],"misconceptions":[2,13,56,96,121],"is":[3],"important":[4],"for":[5,50],"effective":[6],"teaching":[7],"and":[8,18,79,100,118],"assessment.":[9],"However,":[10],"discovering":[11],"such":[12],"manually":[14],"can":[15,23,36],"be":[16],"time-consuming":[17],"laborious.":[19],"Automated":[20],"misconception":[21],"discovery":[22,53],"address":[24],"these":[25,91,120],"challenges":[26],"by":[27],"highlighting":[28],"patterns":[29],"in":[30,61],"student":[31,87],"data,":[32],"which":[33],"domain":[34],"experts":[35],"then":[37],"inspect":[38],"to":[39,84,94],"identify":[40],"misconceptions.":[41],"In":[42],"this":[43],"work,":[44],"we":[45],"present":[46],"a":[47,65,75],"novel":[48],"method":[49],"the":[51,72,81,98],"semi-automated":[52],"of":[54,115],"problem-specific":[55],"from":[57],"program":[59],"code":[60,67],"computing":[62],"courses,":[63],"using":[64],"state-of-the-art":[66],"classification":[68],"model.":[69],"We":[70,89,110],"trained":[71],"model":[73],"on":[74],"block-based":[76],"programming":[77],"dataset":[78],"used":[80],"learned":[82],"embedding":[83],"cluster":[85],"incorrect":[86],"submissions.":[88],"found":[90],"clusters":[92],"correspond":[93],"specific":[95],"about":[97],"problem":[99],"would":[101],"not":[102],"have":[103],"been":[104],"easily":[105],"discovered":[106],"with":[107],"existing":[108],"approaches.":[109],"also":[111],"discuss":[112],"potential":[113],"applications":[114],"our":[116],"approach":[117],"how":[119],"inform":[122],"domain-specific":[123],"insights":[124],"into":[125],"learning":[127],"processes.":[128]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":3}],"updated_date":"2026-04-07T14:57:38.498316","created_date":"2025-10-10T00:00:00"}
