@inproceedings{macaire-etal-2022-automatic,
title = "Automatic Speech Recognition and Query By Example for Creole Languages Documentation",
author = "Macaire, C{\'e}cile and
Schwab, Didier and
Lecouteux, Benjamin and
Schang, Emmanuel",
editor = "Muresan, Smaranda and
Nakov, Preslav and
Villavicencio, Aline",
booktitle = "Findings of the Association for Computational Linguistics: ACL 2022",
month = may,
year = "2022",
address = "Dublin, Ireland",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.findings-acl.197",
doi = "10.18653/v1/2022.findings-acl.197",
pages = "2512--2520",
abstract = "We investigate the exploitation of self-supervised models for two Creole languages with few resources: Gwadloup{\'e}yen and Morisien. Automatic language processing tools are almost non-existent for these two languages. We propose to use about one hour of annotated data to design an automatic speech recognition system for each language. We evaluate how much data is needed to obtain a query-by-example system that is usable by linguists. Moreover, our experiments show that multilingual self-supervised models are not necessarily the most efficient for Creole languages.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="macaire-etal-2022-automatic">
<titleInfo>
<title>Automatic Speech Recognition and Query By Example for Creole Languages Documentation</title>
</titleInfo>
<name type="personal">
<namePart type="given">Cécile</namePart>
<namePart type="family">Macaire</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Didier</namePart>
<namePart type="family">Schwab</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Benjamin</namePart>
<namePart type="family">Lecouteux</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Emmanuel</namePart>
<namePart type="family">Schang</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2022-05</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Findings of the Association for Computational Linguistics: ACL 2022</title>
</titleInfo>
<name type="personal">
<namePart type="given">Smaranda</namePart>
<namePart type="family">Muresan</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Preslav</namePart>
<namePart type="family">Nakov</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Aline</namePart>
<namePart type="family">Villavicencio</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">Dublin, Ireland</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>We investigate the exploitation of self-supervised models for two Creole languages with few resources: Gwadloupéyen and Morisien. Automatic language processing tools are almost non-existent for these two languages. We propose to use about one hour of annotated data to design an automatic speech recognition system for each language. We evaluate how much data is needed to obtain a query-by-example system that is usable by linguists. Moreover, our experiments show that multilingual self-supervised models are not necessarily the most efficient for Creole languages.</abstract>
<identifier type="citekey">macaire-etal-2022-automatic</identifier>
<identifier type="doi">10.18653/v1/2022.findings-acl.197</identifier>
<location>
<url>https://aclanthology.org/2022.findings-acl.197</url>
</location>
<part>
<date>2022-05</date>
<extent unit="page">
<start>2512</start>
<end>2520</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Automatic Speech Recognition and Query By Example for Creole Languages Documentation
%A Macaire, Cécile
%A Schwab, Didier
%A Lecouteux, Benjamin
%A Schang, Emmanuel
%Y Muresan, Smaranda
%Y Nakov, Preslav
%Y Villavicencio, Aline
%S Findings of the Association for Computational Linguistics: ACL 2022
%D 2022
%8 May
%I Association for Computational Linguistics
%C Dublin, Ireland
%F macaire-etal-2022-automatic
%X We investigate the exploitation of self-supervised models for two Creole languages with few resources: Gwadloupéyen and Morisien. Automatic language processing tools are almost non-existent for these two languages. We propose to use about one hour of annotated data to design an automatic speech recognition system for each language. We evaluate how much data is needed to obtain a query-by-example system that is usable by linguists. Moreover, our experiments show that multilingual self-supervised models are not necessarily the most efficient for Creole languages.
%R 10.18653/v1/2022.findings-acl.197
%U https://aclanthology.org/2022.findings-acl.197
%U https://doi.org/10.18653/v1/2022.findings-acl.197
%P 2512-2520
Markdown (Informal)
[Automatic Speech Recognition and Query By Example for Creole Languages Documentation](https://aclanthology.org/2022.findings-acl.197) (Macaire et al., Findings 2022)
ACL