@inproceedings{pintard-francois-2020-combining,
title = "Combining Expert Knowledge with Frequency Information to Infer {CEFR} Levels for Words",
author = "Pintard, Alice and
Fran{\c{c}}ois, Thomas",
editor = "Gala, N{\'u}ria and
Wilkens, Rodrigo",
booktitle = "Proceedings of the 1st Workshop on Tools and Resources to Empower People with REAding DIfficulties (READI)",
month = may,
year = "2020",
address = "Marseille, France",
publisher = "European Language Resources Association",
url = "https://aclanthology.org/2020.readi-1.13",
pages = "85--92",
abstract = "Traditional approaches to set goals in second language (L2) vocabulary acquisition relied either on word lists that were obtained from large L1 corpora or on collective knowledge and experience of L2 experts, teachers, and examiners. Both approaches are known to offer some advantages, but also to have some limitations. In this paper, we try to combine both sources of information, namely the official reference level description for French language and the FLElex lexical database. Our aim is to train a statistical model on the French RLD that would be able to turn the distributional information from FLElex into one of the six levels of the Common European Framework of Reference for languages (CEFR). We show that such approach yields a gain of 29{\%} in accuracy compared to the method currently used in the CEFRLex project. Besides, our experiments also offer deeper insights into the advantages and shortcomings of the two traditional sources of information (frequency vs. expert knowledge).",
language = "English",
ISBN = "979-10-95546-45-0",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="pintard-francois-2020-combining">
<titleInfo>
<title>Combining Expert Knowledge with Frequency Information to Infer CEFR Levels for Words</title>
</titleInfo>
<name type="personal">
<namePart type="given">Alice</namePart>
<namePart type="family">Pintard</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Thomas</namePart>
<namePart type="family">François</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2020-05</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<language>
<languageTerm type="text">English</languageTerm>
<languageTerm type="code" authority="iso639-2b">eng</languageTerm>
</language>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 1st Workshop on Tools and Resources to Empower People with REAding DIfficulties (READI)</title>
</titleInfo>
<name type="personal">
<namePart type="given">Núria</namePart>
<namePart type="family">Gala</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Rodrigo</namePart>
<namePart type="family">Wilkens</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>European Language Resources Association</publisher>
<place>
<placeTerm type="text">Marseille, France</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
<identifier type="isbn">979-10-95546-45-0</identifier>
</relatedItem>
<abstract>Traditional approaches to set goals in second language (L2) vocabulary acquisition relied either on word lists that were obtained from large L1 corpora or on collective knowledge and experience of L2 experts, teachers, and examiners. Both approaches are known to offer some advantages, but also to have some limitations. In this paper, we try to combine both sources of information, namely the official reference level description for French language and the FLElex lexical database. Our aim is to train a statistical model on the French RLD that would be able to turn the distributional information from FLElex into one of the six levels of the Common European Framework of Reference for languages (CEFR). We show that such approach yields a gain of 29% in accuracy compared to the method currently used in the CEFRLex project. Besides, our experiments also offer deeper insights into the advantages and shortcomings of the two traditional sources of information (frequency vs. expert knowledge).</abstract>
<identifier type="citekey">pintard-francois-2020-combining</identifier>
<location>
<url>https://aclanthology.org/2020.readi-1.13</url>
</location>
<part>
<date>2020-05</date>
<extent unit="page">
<start>85</start>
<end>92</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Combining Expert Knowledge with Frequency Information to Infer CEFR Levels for Words
%A Pintard, Alice
%A François, Thomas
%Y Gala, Núria
%Y Wilkens, Rodrigo
%S Proceedings of the 1st Workshop on Tools and Resources to Empower People with REAding DIfficulties (READI)
%D 2020
%8 May
%I European Language Resources Association
%C Marseille, France
%@ 979-10-95546-45-0
%G English
%F pintard-francois-2020-combining
%X Traditional approaches to set goals in second language (L2) vocabulary acquisition relied either on word lists that were obtained from large L1 corpora or on collective knowledge and experience of L2 experts, teachers, and examiners. Both approaches are known to offer some advantages, but also to have some limitations. In this paper, we try to combine both sources of information, namely the official reference level description for French language and the FLElex lexical database. Our aim is to train a statistical model on the French RLD that would be able to turn the distributional information from FLElex into one of the six levels of the Common European Framework of Reference for languages (CEFR). We show that such approach yields a gain of 29% in accuracy compared to the method currently used in the CEFRLex project. Besides, our experiments also offer deeper insights into the advantages and shortcomings of the two traditional sources of information (frequency vs. expert knowledge).
%U https://aclanthology.org/2020.readi-1.13
%P 85-92
Markdown (Informal)
[Combining Expert Knowledge with Frequency Information to Infer CEFR Levels for Words](https://aclanthology.org/2020.readi-1.13) (Pintard & François, READI 2020)
ACL