dc.date.accessioned | 2024-02-06T18:11:23Z | |
dc.date.available | 2024-02-06T18:11:23Z | |
dc.date.created | 2023-06-13T16:19:40Z | |
dc.date.issued | 2023 | |
dc.identifier.citation | Kolesnichenko, Larisa; Velldal, Erik; Øvrelid, Lilja. Word Substitution with Masked Language Models as Data Augmentation for Sentiment Analysis. Proceedings of the Second Workshop on Resources and Representations for Under-Resourced Languages and Domains (RESOURCEFUL-2023). 2023. Association for Computational Linguistics | |
dc.identifier.uri | http://hdl.handle.net/10852/107608 | |
dc.description.abstract | This paper explores the use of masked language modeling (MLM) for data augmentation (DA), targeting structured sentiment analysis (SSA) for Norwegian based on a dataset of annotated reviews. Considering the limited resources for Norwegian language and the complexity of the annotation task, the aim is to investigate whether this approach to data augmentation can help boost the performance. We report on experiments with substituting words both inside and outside of sentiment annotations, and we also present an error analysis, discussing some of the potential pitfalls of using MLM-based DA for SSA, and suggest directions for future work. | |
dc.language | EN | |
dc.publisher | Association for Computational Linguistics | |
dc.rights | Attribution 4.0 International | |
dc.rights.uri | https://creativecommons.org/licenses/by/4.0/ | |
dc.title | Word Substitution with Masked Language Models as Data Augmentation for Sentiment Analysis | |
dc.title.alternative | EN (Engelsk / English): Word Substitution with Masked Language Models as Data Augmentation for Sentiment Analysis | |
dc.type | Chapter | |
dc.creator.author | Kolesnichenko, Larisa | |
dc.creator.author | Velldal, Erik | |
dc.creator.author | Øvrelid, Lilja | |
cristin.unitcode | 185,15,5,48 | |
cristin.unitname | Forskningsgruppen for språkteknologi | |
cristin.ispublished | true | |
cristin.fulltext | original | |
dc.identifier.cristin | 2154216 | |
dc.identifier.bibliographiccitation | info:ofi/fmt:kev:mtx:ctx&ctx_ver=Z39.88-2004&rft_val_fmt=info:ofi/fmt:kev:mtx:book&rft.btitle=Proceedings of the Second Workshop on Resources and Representations for Under-Resourced Languages and Domains (RESOURCEFUL-2023)&rft.spage=&rft.date=2023 | |
dc.identifier.startpage | 42 | |
dc.identifier.endpage | 47 | |
dc.identifier.pagecount | 150 | |
dc.subject.nvi | VDP::Annen informasjonsteknologi: 559 | |
dc.type.document | Bokkapittel | |
dc.type.peerreviewed | Peer reviewed | |
dc.source.isbn | 978-1-959429-73-9 | |
dc.type.version | PublishedVersion | |
cristin.btitle | Proceedings of the Second Workshop on Resources and Representations for Under-Resourced Languages and Domains (RESOURCEFUL-2023) | |
dc.relation.project | NFR/270908 | |