@inproceedings{kao-etal-2008-rapid,
title = "Rapid development of an {E}nglish/{F}arsi speech-to-speech translation system.",
author = "Kao, C.-L. and
Saleem, S. and
Prasad, R. and
Choi, F. and
Natarajan, P. and
Stallard, David and
Krstovski, K. and
Kamali, M.",
booktitle = "Proceedings of the 5th International Workshop on Spoken Language Translation: Papers",
month = oct # " 20-21",
year = "2008",
address = "Waikiki, Hawaii",
url = "https://aclanthology.org/2008.iwslt-papers.4/",
pages = "166--173",
abstract = "Significant advances have been achieved in Speech-to-Speech (S2S) translation systems in recent years. However, rapid configuration of S2S systems for low-resource language pairs and domains remains a challenging problem due to lack of human translated bilingual training data. In this paper, we report on an effort to port our existing English/Iraqi S2S system to the English/Farsi language pair in just 90 days, using only a small amount of training data. This effort included developing acoustic models for Farsi, domain-relevant language models for English and Farsi, and translation models for English-to-Farsi and Farsi-to-English. As part of this work, we developed two novel techniques for expanding the training data, including the reuse of data from different language pairs, and directed collection of new data. In an independent evaluation, the resulting system achieved the highest performance of all systems."
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="kao-etal-2008-rapid">
<titleInfo>
<title>Rapid development of an English/Farsi speech-to-speech translation system.</title>
</titleInfo>
<name type="personal">
<namePart type="given">C.-L.</namePart>
<namePart type="family">Kao</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">S.</namePart>
<namePart type="family">Saleem</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">R.</namePart>
<namePart type="family">Prasad</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">F.</namePart>
<namePart type="family">Choi</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">P.</namePart>
<namePart type="family">Natarajan</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">David</namePart>
<namePart type="family">Stallard</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">K.</namePart>
<namePart type="family">Krstovski</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">M.</namePart>
<namePart type="family">Kamali</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2008-oct 20-21</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 5th International Workshop on Spoken Language Translation: Papers</title>
</titleInfo>
<originInfo>
<place>
<placeTerm type="text">Waikiki, Hawaii</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>Significant advances have been achieved in Speech-to-Speech (S2S) translation systems in recent years. However, rapid configuration of S2S systems for low-resource language pairs and domains remains a challenging problem due to lack of human translated bilingual training data. In this paper, we report on an effort to port our existing English/Iraqi S2S system to the English/Farsi language pair in just 90 days, using only a small amount of training data. This effort included developing acoustic models for Farsi, domain-relevant language models for English and Farsi, and translation models for English-to-Farsi and Farsi-to-English. As part of this work, we developed two novel techniques for expanding the training data, including the reuse of data from different language pairs, and directed collection of new data. In an independent evaluation, the resulting system achieved the highest performance of all systems.</abstract>
<identifier type="citekey">kao-etal-2008-rapid</identifier>
<location>
<url>https://aclanthology.org/2008.iwslt-papers.4/</url>
</location>
<part>
<date>2008-oct 20-21</date>
<extent unit="page">
<start>166</start>
<end>173</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Rapid development of an English/Farsi speech-to-speech translation system.
%A Kao, C.-L.
%A Saleem, S.
%A Prasad, R.
%A Choi, F.
%A Natarajan, P.
%A Stallard, David
%A Krstovski, K.
%A Kamali, M.
%S Proceedings of the 5th International Workshop on Spoken Language Translation: Papers
%D 2008
%8 oct 20-21
%C Waikiki, Hawaii
%F kao-etal-2008-rapid
%X Significant advances have been achieved in Speech-to-Speech (S2S) translation systems in recent years. However, rapid configuration of S2S systems for low-resource language pairs and domains remains a challenging problem due to lack of human translated bilingual training data. In this paper, we report on an effort to port our existing English/Iraqi S2S system to the English/Farsi language pair in just 90 days, using only a small amount of training data. This effort included developing acoustic models for Farsi, domain-relevant language models for English and Farsi, and translation models for English-to-Farsi and Farsi-to-English. As part of this work, we developed two novel techniques for expanding the training data, including the reuse of data from different language pairs, and directed collection of new data. In an independent evaluation, the resulting system achieved the highest performance of all systems.
%U https://aclanthology.org/2008.iwslt-papers.4/
%P 166-173
Markdown (Informal)
[Rapid development of an English/Farsi speech-to-speech translation system.](https://aclanthology.org/2008.iwslt-papers.4/) (Kao et al., IWSLT 2008)
ACL
- C.-L. Kao, S. Saleem, R. Prasad, F. Choi, P. Natarajan, David Stallard, K. Krstovski, and M. Kamali. 2008. Rapid development of an English/Farsi speech-to-speech translation system. In Proceedings of the 5th International Workshop on Spoken Language Translation: Papers, pages 166–173, Waikiki, Hawaii.