dc.contributor.author | Estarrona Ibarloza, Ainara | |
dc.contributor.author | Etxeberria Uztarroz, Izaskun | |
dc.contributor.author | Etxepare Igiñiz, Ricardo | |
dc.contributor.author | Padilla Moyano, Manuel | |
dc.contributor.author | Soraluze Irureta, Ander | |
dc.date.accessioned | 2024-10-14T17:24:12Z | |
dc.date.available | 2024-10-14T17:24:12Z | |
dc.date.issued | 2020-12 | |
dc.identifier.citation | Proceedings of the 7th Workshop on NLP for Similar Languages, Varieties and Dialects : 79-89 (2020) | es_ES |
dc.identifier.uri | http://hdl.handle.net/10810/69931 | |
dc.description.abstract | This paper analyses the challenge of working with dialectal variation when semi-automatically normalising and analysing historical Basque texts. This work is part of a more general ongoing project for the construction of a morphosyntactically annotated historical corpus of Basque called Basque in the Making (BIM): A Historical Look at a European Language Isolate, whose main objective is the systematic and diachronic study of a number of grammatical features. This will be not only the first tagged corpus of historical Basque, but also a means to improve language processing tools by analysing historical Basque varieties more or less distant from present-day standard Basque. | es_ES |
dc.description.sponsorship | Agence Nationale de la Recherche [ANR-17-CE27-0011-BIM]. MINECO [FFI2016-76032-P; RTI2018-098082-J-I00]. Gobierno Vasco [GIC IT1344-19]. | es_ES |
dc.language.iso | eng | es_ES |
dc.publisher | International Committee on Computational Linguistics (ICCL) | es_ES |
dc.rights | info:eu-repo/semantics/openAccess | es_ES |
dc.rights.uri | http://creativecommons.org/licenses/by/4.0/ | * |
dc.subject | text normalisation | es_ES |
dc.subject | digital humanities | es_ES |
dc.subject | historical corpus | es_ES |
dc.subject | diachronic syntax | es_ES |
dc.subject | dialectal variation | es_ES |
dc.title | Dealing with dialectal variation in the construction of the Basque historical corpus | es_ES |
dc.type | info:eu-repo/semantics/conferenceObject | es_ES |
dc.rights.holder | (cc) 2020 The authors, licensed under a Creative Commons Attribution 4.0 International Licence. | es_ES |
dc.relation.publisherversion | https://aclanthology.org/2020.vardial-1.8/ | es_ES |
dc.departamentoes | Lingüística y estudios vascos | es_ES |
dc.departamentoeu | Hizkuntzalaritza eta euskal ikasketak | es_ES |