% Workshop paper (AMTA 2012); see the url field for the canonical record.
% Proper nouns in the title are brace-protected as whole words so that
% sentence-casing styles keep their capitals. The month field concatenates
% the predefined macro with the day of month (renders as "nov 1").
@inproceedings{sellami-etal-2012-exploiting,
  title     = {Exploiting {Wikipedia} as a Knowledge Base for the Extraction of Linguistic Resources: Application on {Arabic}-{French} Comparable Corpora and Bilingual Lexicons},
  author    = {Sellami, Rahma and
               Sadat, Fatiha and
               Hadrich Belguith, Lamia},
  editor    = {Farghaly, Ali and
               Oroumchian, Farhad},
  booktitle = {Fourth Workshop on Computational Approaches to Arabic-Script-based Languages},
  month     = nov # " 1",
  year      = {2012},
  address   = {San Diego, California, USA},
  publisher = {Association for Machine Translation in the Americas},
  url       = {https://aclanthology.org/2012.amta-caas14.10/},
  pages     = {72--79},
  abstract  = {We present simple and effective methods for extracting comparable corpora and bilingual lexicons from Wikipedia. We shall exploit the large scale and the structure of Wikipedia articles to extract two resources that will be very useful for natural language applications. We build a comparable corpus from Wikipedia using categories as topic restrictions and we extract bilingual lexicons from inter-language links aligned with statistical method or a combined statistical and linguistic method.},
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
  <!-- MODS record for one workshop paper. The top-level elements describe the
       paper itself; the relatedItem type="host" describes the proceedings
       volume it appeared in (editors, publisher, place). Dates are written in
       ISO 8601 form (YYYY-MM-DD). -->
  <mods ID="sellami-etal-2012-exploiting">
    <titleInfo>
      <title>Exploiting Wikipedia as a Knowledge Base for the Extraction of Linguistic Resources: Application on Arabic-French Comparable Corpora and Bilingual Lexicons</title>
    </titleInfo>
    <name type="personal">
      <namePart type="given">Rahma</namePart>
      <namePart type="family">Sellami</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Fatiha</namePart>
      <namePart type="family">Sadat</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Lamia</namePart>
      <namePart type="family">Hadrich Belguith</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <originInfo>
      <dateIssued>2012-11-01</dateIssued>
    </originInfo>
    <typeOfResource>text</typeOfResource>
    <relatedItem type="host">
      <titleInfo>
        <title>Fourth Workshop on Computational Approaches to Arabic-Script-based Languages</title>
      </titleInfo>
      <name type="personal">
        <namePart type="given">Ali</namePart>
        <namePart type="family">Farghaly</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <name type="personal">
        <namePart type="given">Farhad</namePart>
        <namePart type="family">Oroumchian</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <originInfo>
        <publisher>Association for Machine Translation in the Americas</publisher>
        <place>
          <placeTerm type="text">San Diego, California, USA</placeTerm>
        </place>
      </originInfo>
      <genre authority="marcgt">conference publication</genre>
    </relatedItem>
    <abstract>We present simple and effective methods for extracting comparable corpora and bilingual lexicons from Wikipedia. We shall exploit the large scale and the structure of Wikipedia articles to extract two resources that will be very useful for natural language applications. We build a comparable corpus from Wikipedia using categories as topic restrictions and we extract bilingual lexicons from inter-language links aligned with statistical method or a combined statistical and linguistic method.</abstract>
    <identifier type="citekey">sellami-etal-2012-exploiting</identifier>
    <location>
      <url>https://aclanthology.org/2012.amta-caas14.10/</url>
    </location>
    <part>
      <date>2012-11-01</date>
      <extent unit="page">
        <start>72</start>
        <end>79</end>
      </extent>
    </part>
  </mods>
</modsCollection>
%0 Conference Proceedings
%T Exploiting Wikipedia as a Knowledge Base for the Extraction of Linguistic Resources: Application on Arabic-French Comparable Corpora and Bilingual Lexicons
%A Sellami, Rahma
%A Sadat, Fatiha
%A Hadrich Belguith, Lamia
%Y Farghaly, Ali
%Y Oroumchian, Farhad
%S Fourth Workshop on Computational Approaches to Arabic-Script-based Languages
%D 2012
%8 nov 1
%I Association for Machine Translation in the Americas
%C San Diego, California, USA
%F sellami-etal-2012-exploiting
%X We present simple and effective methods for extracting comparable corpora and bilingual lexicons from Wikipedia. We shall exploit the large scale and the structure of Wikipedia articles to extract two resources that will be very useful for natural language applications. We build a comparable corpus from Wikipedia using categories as topic restrictions and we extract bilingual lexicons from inter-language links aligned with statistical method or a combined statistical and linguistic method.
%U https://aclanthology.org/2012.amta-caas14.10/
%P 72-79
Markdown (Informal)
[Exploiting Wikipedia as a Knowledge Base for the Extraction of Linguistic Resources: Application on Arabic-French Comparable Corpora and Bilingual Lexicons](https://aclanthology.org/2012.amta-caas14.10/) (Sellami et al., AMTA 2012)
ACL