@inproceedings{karimova-etal-2014-offline,
title = "Offline extraction of overlapping phrases for hierarchical phrase-based translation",
author = "Karimova, Sariya and
Simianer, Patrick and
Riezler, Stefan",
editor = {Federico, Marcello and
St{\"u}ker, Sebastian and
Yvon, Fran{\c{c}}ois},
booktitle = "Proceedings of the 11th International Workshop on Spoken Language Translation: Papers",
month = dec # " 4-5",
year = "2014",
address = "Lake Tahoe, California",
url = "https://aclanthology.org/2014.iwslt-papers.12/",
pages = "236--243",
abstract = "Standard SMT decoders operate by translating disjoint spans of input words, thus discarding information in form of overlapping phrases that is present at phrase extraction time. The use of overlapping phrases in translation may enhance fluency in positions that would otherwise be phrase boundaries, they may provide additional statistical support for long and rare phrases, and they may generate new phrases that have never been seen in the training data. We show how to extract overlapping phrases offline for hierarchical phrase-based SMT, and how to extract features and tune weights for the new phrases. We find gains of 0.3 {\ensuremath{-}} 0.6 BLEU points over discriminatively trained hierarchical phrase-based SMT systems on two datasets for German-to-English translation."
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="karimova-etal-2014-offline">
<titleInfo>
<title>Offline extraction of overlapping phrases for hierarchical phrase-based translation</title>
</titleInfo>
<name type="personal">
<namePart type="given">Sariya</namePart>
<namePart type="family">Karimova</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Patrick</namePart>
<namePart type="family">Simianer</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Stefan</namePart>
<namePart type="family">Riezler</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2014-dec 4-5</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 11th International Workshop on Spoken Language Translation: Papers</title>
</titleInfo>
<name type="personal">
<namePart type="given">Marcello</namePart>
<namePart type="family">Federico</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Sebastian</namePart>
<namePart type="family">Stüker</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">François</namePart>
<namePart type="family">Yvon</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<place>
<placeTerm type="text">Lake Tahoe, California</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>Standard SMT decoders operate by translating disjoint spans of input words, thus discarding information in form of overlapping phrases that is present at phrase extraction time. The use of overlapping phrases in translation may enhance fluency in positions that would otherwise be phrase boundaries, they may provide additional statistical support for long and rare phrases, and they may generate new phrases that have never been seen in the training data. We show how to extract overlapping phrases offline for hierarchical phrase-based SMT, and how to extract features and tune weights for the new phrases. We find gains of 0.3–0.6 BLEU points over discriminatively trained hierarchical phrase-based SMT systems on two datasets for German-to-English translation.</abstract>
<identifier type="citekey">karimova-etal-2014-offline</identifier>
<location>
<url>https://aclanthology.org/2014.iwslt-papers.12/</url>
</location>
<part>
<date>2014-dec 4-5</date>
<extent unit="page">
<start>236</start>
<end>243</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Offline extraction of overlapping phrases for hierarchical phrase-based translation
%A Karimova, Sariya
%A Simianer, Patrick
%A Riezler, Stefan
%Y Federico, Marcello
%Y Stüker, Sebastian
%Y Yvon, François
%S Proceedings of the 11th International Workshop on Spoken Language Translation: Papers
%D 2014
%8 dec 4-5
%C Lake Tahoe, California
%F karimova-etal-2014-offline
%X Standard SMT decoders operate by translating disjoint spans of input words, thus discarding information in form of overlapping phrases that is present at phrase extraction time. The use of overlapping phrases in translation may enhance fluency in positions that would otherwise be phrase boundaries, they may provide additional statistical support for long and rare phrases, and they may generate new phrases that have never been seen in the training data. We show how to extract overlapping phrases offline for hierarchical phrase-based SMT, and how to extract features and tune weights for the new phrases. We find gains of 0.3–0.6 BLEU points over discriminatively trained hierarchical phrase-based SMT systems on two datasets for German-to-English translation.
%U https://aclanthology.org/2014.iwslt-papers.12/
%P 236-243
Markdown (Informal)
[Offline extraction of overlapping phrases for hierarchical phrase-based translation](https://aclanthology.org/2014.iwslt-papers.12/) (Karimova et al., IWSLT 2014)
ACL