{"id":"https://openalex.org/W3197876970","doi":"https://doi.org/10.18653/v1/2021.emnlp-demo.21","title":"Datasets: A Community Library for Natural Language Processing","display_name":"Datasets: A Community Library for Natural Language Processing","publication_year":2021,"publication_date":"2021-01-01","ids":{"openalex":"https://openalex.org/W3197876970","doi":"https://doi.org/10.18653/v1/2021.emnlp-demo.21","mag":"3197876970"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2021.emnlp-demo.21","pdf_url":"https://aclanthology.org/2021.emnlp-demo.21.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"type":"preprint","type_crossref":"proceedings-article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://aclanthology.org/2021.emnlp-demo.21.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5074885928","display_name":"Quentin Lhoest","orcid":"https://orcid.org/0009-0000-7660-3420"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Quentin Lhoest","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021727268","display_name":"A. Villanova del Moral","orcid":"https://orcid.org/0000-0003-1727-1045"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Albert Villanova del Moral","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000126238","display_name":"Yacine Jernite","orcid":"https://orcid.org/0000-0002-8053-6862"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yacine Jernite","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107980345","display_name":"Abhishek Thakur","orcid":"https://orcid.org/0000-0003-4149-1312"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Abhishek Thakur","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025097230","display_name":"Patrick von Platen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Patrick von Platen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043714535","display_name":"Suraj Patil","orcid":"https://orcid.org/0009-0005-2486-0544"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Suraj Patil","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038505596","display_name":"Julien Chaumond","orcid":"https://orcid.org/0000-0003-3188-1616"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Julien Chaumond","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051831524","display_name":"Mariama Drame","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mariama Drame","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057464576","display_name":"Julien Plu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Julien Plu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063084634","display_name":"Lewis Tunstall","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lewis Tunstall","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058679972","display_name":"Joe Davison","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Joe Davison","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075136074","display_name":"Mario \u0160a\u0161ko","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mario \u0160a\u0161ko","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069149197","display_name":"Gunjan Chhablani","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gunjan Chhablani","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070126273","display_name":"Bhavitvya Malik","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bhavitvya Malik","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016319533","display_name":"Simon Brandeis","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Simon Brandeis","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084957527","display_name":"Teven Le Scao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Teven Le Scao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049805631","display_name":"Victor Sanh","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Victor Sanh","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102941860","display_name":"Canwen Xu","orcid":"https://orcid.org/0000-0002-1552-999X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Canwen Xu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059947211","display_name":"Nicolas Patry","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nicolas Patry","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063040968","display_name":"Angelina McMillan-Major","orcid":"https://orcid.org/0000-0003-2257-9618"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Angelina McMillan-Major","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113496357","display_name":"Philipp Schmid","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Philipp Schmid","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041801887","display_name":"Sylvain Gugger","orcid":"https://orcid.org/0000-0001-8056-2713"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sylvain Gugger","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009717413","display_name":"Cl\u00e9ment Delangue","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cl\u00e9ment Delangue","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046258903","display_name":"Th\u00e9o Matussi\u00e8re","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Th\u00e9o Matussi\u00e8re","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069696966","display_name":"Lysandre Debut","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lysandre Debut","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079005032","display_name":"Stas Bekman","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Stas Bekman","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027534072","display_name":"Pierric Cistac","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pierric Cistac","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073755325","display_name":"Thibault Goehringer","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Thibault Goehringer","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038928331","display_name":"Victor Mustar","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Victor Mustar","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076325114","display_name":"Fran\u00e7ois Lagunas","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fran\u00e7ois Lagunas","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062546146","display_name":"Alexander M. Rush","orcid":"https://orcid.org/0000-0002-9900-1606"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alexander Rush","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5107899645","display_name":"Thomas Wolf","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Thomas Wolf","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"fulltext_origin":"pdf","cited_by_count":253,"citation_normalized_percentile":{"value":0.999952,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Natural Language Processing","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Natural Language Processing","score":0.9999,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Statistical Machine Translation and Natural Language Processing","score":0.9992,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Automatic Keyword Extraction from Textual Data","score":0.9755,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/language-modeling","display_name":"Language Modeling","score":0.561224},{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine Translation","score":0.551135},{"id":"https://openalex.org/keywords/neural-machine-translation","display_name":"Neural Machine Translation","score":0.53545},{"id":"https://openalex.org/keywords/word-representation","display_name":"Word Representation","score":0.529097},{"id":"https://openalex.org/keywords/multilingual-neural-machine-translation","display_name":"Multilingual Neural Machine Translation","score":0.522953}],"concepts":[{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.4523774},{"id":"https://openalex.org/C52119013","wikidata":"https://www.wikidata.org/wiki/Q50637","display_name":"Art history","level":1,"score":0.42683083},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.34201485}],"mesh":[],"locations_count":2,"locations":[{"is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2021.emnlp-demo.21","pdf_url":"https://aclanthology.org/2021.emnlp-demo.21.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2109.02846","pdf_url":"https://arxiv.org/pdf/2109.02846","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2021.emnlp-demo.21","pdf_url":"https://aclanthology.org/2021.emnlp-demo.21.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":45,"referenced_works":["https://openalex.org/W1089141","https://openalex.org/W1632114991","https://openalex.org/W2048390999","https://openalex.org/W2093664665","https://openalex.org/W2098921539","https://openalex.org/W2143017621","https://openalex.org/W2395259056","https://openalex.org/W2579343286","https://openalex.org/W2593864460","https://openalex.org/W2767899794","https://openalex.org/W2795038878","https://openalex.org/W2809324505","https://openalex.org/W2911227954","https://openalex.org/W2923014074","https://openalex.org/W2950681488","https://openalex.org/W2951299559","https://openalex.org/W2962736243","https://openalex.org/W2962739339","https://openalex.org/W2962843521","https://openalex.org/W2963310665","https://openalex.org/W2963341956","https://openalex.org/W2963506925","https://openalex.org/W2963661177","https://openalex.org/W2963748441","https://openalex.org/W3027879771","https://openalex.org/W3035296331","https://openalex.org/W3082274269","https://openalex.org/W3098903812","https://openalex.org/W3107298362","https://openalex.org/W3120706522","https://openalex.org/W3127861905","https://openalex.org/W3135371071","https://openalex.org/W3137010024","https://openalex.org/W3169841173","https://openalex.org/W3172794097","https://openalex.org/W3173247149","https://openalex.org/W3186655327","https://openalex.org/W3193521099","https://openalex.org/W4251372957","https://openalex.org/W4287116725","https://openalex.org/W4288089799","https://openalex.org/W4292779060","https://openalex.org/W4293350112","https://openalex.org/W4295601746","https://openalex.org/W4299585995"],"related_works":["https://openalex.org/W4387497383","https://openalex.org/W3193615524","https://openalex.org/W3183948672","https://openalex.org/W3173606202","https://openalex.org/W3110381201","https://openalex.org/W2948807893","https://openalex.org/W2778153218","https://openalex.org/W2758277628","https://openalex.org/W2748952813","https://openalex.org/W1531601525"],"abstract_inverted_index":{"Quentin":[0],"Lhoest,":[1],"Albert":[2],"Villanova":[3],"del":[4],"Moral,":[5],"Yacine":[6],"Jernite,":[7],"Abhishek":[8],"Thakur,":[9],"Patrick":[10],"von":[11],"Platen,":[12],"Suraj":[13],"Patil,":[14],"Julien":[15,19],"Chaumond,":[16],"Mariama":[17],"Drame,":[18],"Plu,":[20],"Lewis":[21],"Tunstall,":[22],"Joe":[23],"Davison,":[24],"Mario":[25],"\u0160a\u0161ko,":[26],"Gunjan":[27],"Chhablani,":[28],"Bhavitvya":[29],"Malik,":[30],"Simon":[31],"Brandeis,":[32],"Teven":[33],"Le":[34],"Scao,":[35],"Victor":[36,60],"Sanh,":[37],"Canwen":[38],"Xu,":[39],"Nicolas":[40],"Patry,":[41],"Angelina":[42],"McMillan-Major,":[43],"Philipp":[44],"Schmid,":[45],"Sylvain":[46],"Gugger,":[47],"Cl\u00e9ment":[48],"Delangue,":[49],"Th\u00e9o":[50],"Matussi\u00e8re,":[51],"Lysandre":[52],"Debut,":[53],"Stas":[54],"Bekman,":[55],"Pierric":[56],"Cistac,":[57],"Thibault":[58],"Goehringer,":[59],"Mustar,":[61],"Fran\u00e7ois":[62],"Lagunas,":[63],"Alexander":[64],"Rush,":[65],"Thomas":[66],"Wolf.":[67],"Proceedings":[68],"of":[69],"the":[70],"2021":[71],"Conference":[72],"on":[73],"Empirical":[74],"Methods":[75],"in":[76],"Natural":[77],"Language":[78],"Processing:":[79],"System":[80],"Demonstrations.":[81],"2021.":[82]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W3197876970","counts_by_year":[{"year":2024,"cited_by_count":19},{"year":2023,"cited_by_count":147},{"year":2022,"cited_by_count":78},{"year":2021,"cited_by_count":8}],"updated_date":"2024-11-05T19:38:59.216941","created_date":"2021-09-13"}