{"id":"https://openalex.org/W2895458936","doi":"https://doi.org/10.18653/v1/w18-6103","title":"Geocoding Without Geotags: A Text-based Approach for reddit","display_name":"Geocoding Without Geotags: A Text-based Approach for reddit","publication_year":2018,"publication_date":"2018-01-01","ids":{"openalex":"https://openalex.org/W2895458936","doi":"https://doi.org/10.18653/v1/w18-6103","mag":"2895458936"},"language":"en","primary_location":{"id":"doi:10.18653/v1/w18-6103","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/w18-6103","pdf_url":"https://www.aclweb.org/anthology/W18-6103.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2018 EMNLP Workshop W-NUT: The 4th Workshop on Noisy User-generated Text","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.aclweb.org/anthology/W18-6103.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5080826010","display_name":"Keith Harrigian","orcid":"https://orcid.org/0000-0001-9483-8469"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Keith Harrigian","raw_affiliation_strings":["Warner Media Applied Analytics Boston, MA"],"affiliations":[{"raw_affiliation_string":"Warner Media Applied Analytics Boston, MA","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5080826010"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":3.6706,"has_fulltext":true,"cited_by_count":26,"citation_normalized_percentile":{"value":0.92051832,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"17","last_page":"27"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11980","display_name":"Human Mobility and Location-Based Analysis","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/3313","display_name":"Transportation"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11980","display_name":"Human Mobility and Location-Based Analysis","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/3313","display_name":"Transportation"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11819","display_name":"Data-Driven Disease Surveillance","score":0.9904000163078308,"subfield":{"id":"https://openalex.org/subfields/2713","display_name":"Epidemiology"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.953499972820282,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/geolocation","display_name":"Geolocation","score":0.9505084753036499},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8104990720748901},{"id":"https://openalex.org/keywords/geocoding","display_name":"Geocoding","score":0.7265154123306274},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.7184662818908691},{"id":"https://openalex.org/keywords/social-media","display_name":"Social media","score":0.6452510952949524},{"id":"https://openalex.org/keywords/metadata","display_name":"Metadata","score":0.6067472100257874},{"id":"https://openalex.org/keywords/ground-truth","display_name":"Ground truth","score":0.6021963953971863},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5782251358032227},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.449546754360199},{"id":"https://openalex.org/keywords/schema","display_name":"Schema (genetic algorithms)","score":0.43715909123420715},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.4250318109989166},{"id":"https://openalex.org/keywords/geotagging","display_name":"Geotagging","score":0.4211881756782532},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3647342622280121},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.32657590508461},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.20669332146644592}],"concepts":[{"id":"https://openalex.org/C22041718","wikidata":"https://www.wikidata.org/wiki/Q638949","display_name":"Geolocation","level":2,"score":0.9505084753036499},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8104990720748901},{"id":"https://openalex.org/C42629822","wikidata":"https://www.wikidata.org/wiki/Q1346408","display_name":"Geocoding","level":2,"score":0.7265154123306274},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.7184662818908691},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.6452510952949524},{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.6067472100257874},{"id":"https://openalex.org/C146849305","wikidata":"https://www.wikidata.org/wiki/Q370766","display_name":"Ground truth","level":2,"score":0.6021963953971863},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5782251358032227},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.449546754360199},{"id":"https://openalex.org/C52146309","wikidata":"https://www.wikidata.org/wiki/Q7431116","display_name":"Schema (genetic algorithms)","level":2,"score":0.43715909123420715},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4250318109989166},{"id":"https://openalex.org/C53605480","wikidata":"https://www.wikidata.org/wiki/Q852595","display_name":"Geotagging","level":2,"score":0.4211881756782532},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3647342622280121},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.32657590508461},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.20669332146644592},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C62649853","wikidata":"https://www.wikidata.org/wiki/Q199687","display_name":"Remote sensing","level":1,"score":0.0},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/w18-6103","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/w18-6103","pdf_url":"https://www.aclweb.org/anthology/W18-6103.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2018 EMNLP Workshop W-NUT: The 4th Workshop on Noisy User-generated Text","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/w18-6103","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/w18-6103","pdf_url":"https://www.aclweb.org/anthology/W18-6103.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2018 EMNLP Workshop W-NUT: The 4th Workshop on Noisy User-generated Text","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2895458936.pdf","grobid_xml":"https://content.openalex.org/works/W2895458936.grobid-xml"},"referenced_works_count":37,"referenced_works":["https://openalex.org/W150644790","https://openalex.org/W802248758","https://openalex.org/W1550708636","https://openalex.org/W1984189333","https://openalex.org/W1984272552","https://openalex.org/W2007791237","https://openalex.org/W2018277822","https://openalex.org/W2022496558","https://openalex.org/W2040324983","https://openalex.org/W2044688197","https://openalex.org/W2082260230","https://openalex.org/W2091802992","https://openalex.org/W2103133870","https://openalex.org/W2112594516","https://openalex.org/W2127498532","https://openalex.org/W2136518070","https://openalex.org/W2137435333","https://openalex.org/W2139329027","https://openalex.org/W2142191319","https://openalex.org/W2142889507","https://openalex.org/W2164631912","https://openalex.org/W2168346693","https://openalex.org/W2172085063","https://openalex.org/W2196009790","https://openalex.org/W2213844264","https://openalex.org/W2250457198","https://openalex.org/W2251535681","https://openalex.org/W2282112529","https://openalex.org/W2464870181","https://openalex.org/W2467321947","https://openalex.org/W2776671924","https://openalex.org/W2791575854","https://openalex.org/W2805571859","https://openalex.org/W2902405430","https://openalex.org/W2963145593","https://openalex.org/W2963666326","https://openalex.org/W3102617382"],"related_works":["https://openalex.org/W1718163567","https://openalex.org/W4300347823","https://openalex.org/W3195869169","https://openalex.org/W4366460429","https://openalex.org/W3021787161","https://openalex.org/W4220951331","https://openalex.org/W4313533154","https://openalex.org/W4283791994","https://openalex.org/W797920393","https://openalex.org/W2019957373"],"abstract_inverted_index":{"In":[0,31],"this":[1],"paper,":[2],"we":[3,33,63,84],"introduce":[4],"the":[5,49,57,93],"first":[6],"geolocation":[7,68,80,87],"inference":[8,25,69],"approach":[9],"for":[10,45],"reddit,":[11],"a":[12,35],"social":[13],"media":[14],"platform":[15],"where":[16,111],"user":[17],"pseudonymity":[18],"has":[19],"thus":[20],"far":[21],"made":[22],"supervised":[23],"demographic":[24],"difficult":[26],"to":[27,39,100,118],"implement":[28],"and":[29,65,76,90],"validate.":[30],"particular,":[32],"design":[34],"text-based":[36],"heuristic":[37],"schema":[38],"generate":[40],"ground":[41],"truth":[42],"location":[43],"labels":[44],"reddit":[46,73,110],"users":[47],"in":[48],"absence":[50],"of":[51,59],"explicitly":[52],"geotagged":[53],"data.":[54],"After":[55],"evaluating":[56],"accuracy":[58],"our":[60,72],"labeling":[61],"procedure,":[62],"train":[64],"test":[66],"several":[67],"models":[70,88,98],"across":[71,104],"data":[74,81,103],"set":[75],"three":[77],"benchmark":[78],"Twitter":[79],"sets.":[82],"Ultimately,":[83],"show":[85],"that":[86],"trained":[89],"applied":[91],"on":[92,109],"same":[94],"domain":[95],"substantially":[96],"outperform":[97],"attempting":[99],"transfer":[101],"training":[102],"domains,":[105],"even":[106],"more":[107],"so":[108],"platformspecific":[112],"interest-group":[113],"metadata":[114],"can":[115],"be":[116],"used":[117],"improve":[119],"inferences.":[120]},"counts_by_year":[{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":5},{"year":2021,"cited_by_count":7},{"year":2019,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
