@inproceedings{jasonarson-etal-2024-cogs,
title = "Cogs in a Machine, Doing What They{'}re Meant to Do {--} the {AMI} Submission to the {WMT}24 General Translation Task",
author = "Jasonarson, Atli and
Hafsteinsson, Hinrik and
{\'A}rmannsson, Bjarki and
Steingr{\'\i}msson, Steinth{\'o}r",
editor = "Haddow, Barry and
Kocmi, Tom and
Koehn, Philipp and
Monz, Christof",
booktitle = "Proceedings of the Ninth Conference on Machine Translation",
month = nov,
year = "2024",
address = "Miami, Florida, USA",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2024.wmt-1.18",
doi = "10.18653/v1/2024.wmt-1.18",
pages = "253--262",
abstract = "This paper presents the submission of the Arni Magnusson Institute{'}s team to the WMT24 General translation task. We work on the English→Icelandic translation direction. Our system comprises four translation models and a grammar correction model. For training our systems we carefully curate our datasets, aggressively filtering out sentence pairs that may detrimentally affect the quality of our systems{'} output. Some of our data are collected from human translations and some are synthetically generated. A part of the synthetic data is generated using an LLM, and we find that it increases the translation capability of our system significantly.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="jasonarson-etal-2024-cogs">
<titleInfo>
<title>Cogs in a Machine, Doing What They’re Meant to Do – the AMI Submission to the WMT24 General Translation Task</title>
</titleInfo>
<name type="personal">
<namePart type="given">Atli</namePart>
<namePart type="family">Jasonarson</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Hinrik</namePart>
<namePart type="family">Hafsteinsson</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Bjarki</namePart>
<namePart type="family">Ármannsson</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Steinthór</namePart>
<namePart type="family">Steingrímsson</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2024-11</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the Ninth Conference on Machine Translation</title>
</titleInfo>
<name type="personal">
<namePart type="given">Barry</namePart>
<namePart type="family">Haddow</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Tom</namePart>
<namePart type="family">Kocmi</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Philipp</namePart>
<namePart type="family">Koehn</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Christof</namePart>
<namePart type="family">Monz</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">Miami, Florida, USA</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>This paper presents the submission of the Arni Magnusson Institute’s team to the WMT24 General translation task. We work on the English→Icelandic translation direction. Our system comprises four translation models and a grammar correction model. For training our systems we carefully curate our datasets, aggressively filtering out sentence pairs that may detrimentally affect the quality of our systems’ output. Some of our data are collected from human translations and some are synthetically generated. A part of the synthetic data is generated using an LLM, and we find that it increases the translation capability of our system significantly.</abstract>
<identifier type="citekey">jasonarson-etal-2024-cogs</identifier>
<identifier type="doi">10.18653/v1/2024.wmt-1.18</identifier>
<location>
<url>https://aclanthology.org/2024.wmt-1.18</url>
</location>
<part>
<date>2024-11</date>
<extent unit="page">
<start>253</start>
<end>262</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Cogs in a Machine, Doing What They’re Meant to Do – the AMI Submission to the WMT24 General Translation Task
%A Jasonarson, Atli
%A Hafsteinsson, Hinrik
%A Ármannsson, Bjarki
%A Steingrímsson, Steinthór
%Y Haddow, Barry
%Y Kocmi, Tom
%Y Koehn, Philipp
%Y Monz, Christof
%S Proceedings of the Ninth Conference on Machine Translation
%D 2024
%8 November
%I Association for Computational Linguistics
%C Miami, Florida, USA
%F jasonarson-etal-2024-cogs
%X This paper presents the submission of the Arni Magnusson Institute’s team to the WMT24 General translation task. We work on the English→Icelandic translation direction. Our system comprises four translation models and a grammar correction model. For training our systems we carefully curate our datasets, aggressively filtering out sentence pairs that may detrimentally affect the quality of our systems’ output. Some of our data are collected from human translations and some are synthetically generated. A part of the synthetic data is generated using an LLM, and we find that it increases the translation capability of our system significantly.
%R 10.18653/v1/2024.wmt-1.18
%U https://aclanthology.org/2024.wmt-1.18
%U https://doi.org/10.18653/v1/2024.wmt-1.18
%P 253-262
Markdown (Informal)
[Cogs in a Machine, Doing What They’re Meant to Do – the AMI Submission to the WMT24 General Translation Task](https://aclanthology.org/2024.wmt-1.18) (Jasonarson et al., WMT 2024)
ACL