dc.contributor.author | Kurimo, Mikko | |
dc.contributor.author | Getman, Yaroslav | |
dc.contributor.author | Voskoboinik, Ekaterina | |
dc.contributor.author | Al-Ghezi, Ragheb | |
dc.contributor.author | Kallio, Heini | |
dc.contributor.author | Kuronen, Mikko | |
dc.contributor.author | von Zansen, Anna | |
dc.contributor.author | Hilden, Raili | |
dc.contributor.author | Kronholm, Sirkku | |
dc.contributor.author | Huhta, Ari | |
dc.contributor.author | Linden, Krister | |
dc.date.accessioned | 2023-09-01T10:57:05Z | |
dc.date.available | 2023-09-01T10:57:05Z | |
dc.date.issued | 2023 | |
dc.identifier.citation | Kurimo, M., Getman, Y., Voskoboinik, E., Al-Ghezi, R., Kallio, H., Kuronen, M., von Zansen, A., Hilden, R., Kronholm, S., Huhta, A., & Linden, K. (2023). New data, benchmark and baseline for L2 speaking assessment for low-resource languages. In <i>Proceedings of the 9th Workshop on Speech and Language Technology in Education (SLaTE) </i> (pp. 166-170). International Speech Communication Association. <a href="https://doi.org/10.21437/SLaTE.2023-32" target="_blank">https://doi.org/10.21437/SLaTE.2023-32</a> | |
dc.identifier.other | CONVID_184436350 | |
dc.identifier.uri | https://jyx.jyu.fi/handle/123456789/88853 | |
dc.description.abstract | The development of large multilingual speech models provides the possibility to construct high-quality speech technology even for low-resource languages. In this paper, we present the speech data of L2 learners of Finnish and Finland Swedish that we have recently collected for training and evaluation of automatic speech recognition (ASR) and speaking assessment (ASA). It includes over 4000 recordings by over 300 students per language in short read-aloud and free-form tasks. The recordings have been manually transcribed and assessed for pronunciation, fluency, range, accuracy, task achievement, and a holistic proficiency level. We present also an ASR and ASA benchmarking setup we have constructed using this data and include results from our baseline systems built by fine-tuning self-supervised multilingual model for the target language. In addition to benchmarking, our baseline system can be used by L2 students and teachers for online self-training and evaluation of oral proficiency. | en |
dc.format.extent | 186 | |
dc.format.mimetype | application/pdf | |
dc.language.iso | eng | |
dc.publisher | International Speech Communication Association | |
dc.relation.ispartof | Proceedings of the 9th Workshop on Speech and Language Technology in Education (SLaTE) | |
dc.rights | In Copyright | |
dc.subject.other | puhemallit | |
dc.subject.other | ASR | |
dc.subject.other | L2 speaking assessment | |
dc.subject.other | wav2vec2.0 | |
dc.subject.other | low-resource languages | |
dc.title | New data, benchmark and baseline for L2 speaking assessment for low-resource languages | |
dc.type | conferenceObject | |
dc.identifier.urn | URN:NBN:fi:jyu-202309014887 | |
dc.contributor.laitos | Soveltavan kielentutkimuksen keskus | fi |
dc.contributor.laitos | Kieli- ja viestintätieteiden laitos | fi |
dc.contributor.laitos | Centre for Applied Language Studies | en |
dc.contributor.laitos | Department of Language and Communication Studies | en |
dc.contributor.oppiaine | Soveltava kielentutkimus | fi |
dc.contributor.oppiaine | Ruotsin kieli | fi |
dc.contributor.oppiaine | Hyvinvoinnin tutkimuksen yhteisö | fi |
dc.contributor.oppiaine | Suomen kieli | fi |
dc.contributor.oppiaine | Applied language studies | en |
dc.contributor.oppiaine | Swedish | en |
dc.contributor.oppiaine | School of Wellbeing | en |
dc.contributor.oppiaine | Finnish | en |
dc.type.uri | http://purl.org/eprint/type/ConferencePaper | |
dc.type.coar | http://purl.org/coar/resource_type/c_5794 | |
dc.description.reviewstatus | nonPeerReviewed | |
dc.format.pagerange | 166-170 | |
dc.type.version | publishedVersion | |
dc.rights.copyright | © 2023 International Speech Communication Association | |
dc.rights.accesslevel | openAccess | fi |
dc.relation.conference | Workshop on Speech and Language Technology in Education | |
dc.relation.grantnumber | 322965 | |
dc.subject.yso | suomi toisena kielenä | |
dc.subject.yso | suomenruotsi | |
dc.subject.yso | arviointi | |
dc.subject.yso | puheentunnistus | |
dc.subject.yso | toinen kieli | |
dc.subject.yso | ruotsi toisena kielenä | |
dc.subject.yso | monikielisyys | |
dc.subject.yso | kielen oppiminen | |
dc.subject.yso | suullinen kielitaito | |
dc.subject.yso | puhe (puhuminen) | |
dc.format.content | fulltext | |
jyx.subject.uri | http://www.yso.fi/onto/yso/p24613 | |
jyx.subject.uri | http://www.yso.fi/onto/yso/p12864 | |
jyx.subject.uri | http://www.yso.fi/onto/yso/p7413 | |
jyx.subject.uri | http://www.yso.fi/onto/yso/p8264 | |
jyx.subject.uri | http://www.yso.fi/onto/yso/p17005 | |
jyx.subject.uri | http://www.yso.fi/onto/yso/p24614 | |
jyx.subject.uri | http://www.yso.fi/onto/yso/p6720 | |
jyx.subject.uri | http://www.yso.fi/onto/yso/p24061 | |
jyx.subject.uri | http://www.yso.fi/onto/yso/p17782 | |
jyx.subject.uri | http://www.yso.fi/onto/yso/p2492 | |
dc.rights.url | http://rightsstatements.org/page/InC/1.0/?language=en | |
dc.relation.doi | 10.21437/SLaTE.2023-32 | |
dc.relation.funder | Research Council of Finland | en |
dc.relation.funder | Suomen Akatemia | fi |
jyx.fundingprogram | Academy Project, AoF | en |
jyx.fundingprogram | Akatemiahanke, SA | fi |
jyx.fundinginformation | This work was done and the data were collected as part of the Academy of Finland grants number 322619, 322625, 322965 and 337073. | |
dc.type.okm | D3 | |