@inproceedings{silva-etal-2004-extracting,
title = "Extracting Named Entities. A Statistical Approach",
author = "Silva, Joaquim and
Kozareva, Zornitsa and
Noncheva, Veska and
Lopes, Gabriel",
editor = {Blache, Philippe and
Nguyen, No{\"e}l and
Chenfour, Nouredine and
Rajouani, Abdenbi},
booktitle = "Actes de la 11{\`e}me conf{\'e}rence sur le Traitement Automatique des Langues Naturelles. Posters",
month = apr,
year = "2004",
address = "F{\`e}s, Maroc",
publisher = "ATALA",
url = "https://aclanthology.org/2004.jeptalnrecital-poster.21/",
pages = "125--130",
abstract = "Named entities and more generally Multiword Lexical Units (MWUs) are important for various applications. However, language independent methods for automatically extracting MWUs do not provide us with clean data. So, in this paper we propose a method for selecting possible named entities from automatically extracted MWUs, and later, a statistics-based language independent unsupervised approach is applied to possible named entities in order to cluster them according to their type. Statistical features used by our clustering process are described and motivated. The Model-Based Clustering Analysis (MBCA) software enabled us to obtain different clusters for proposed named entities. The method was applied to Bulgarian and English. For some clusters, precision is very high; other clusters still need further refinement. Based on the obtained clusters, it is also possible to classify new possible named entities."
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="silva-etal-2004-extracting">
<titleInfo>
<title>Extracting Named Entities. A Statistical Approach</title>
</titleInfo>
<name type="personal">
<namePart type="given">Joaquim</namePart>
<namePart type="family">Silva</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Zornitsa</namePart>
<namePart type="family">Kozareva</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Veska</namePart>
<namePart type="family">Noncheva</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Gabriel</namePart>
<namePart type="family">Lopes</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2004-04</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Actes de la 11ème conférence sur le Traitement Automatique des Langues Naturelles. Posters</title>
</titleInfo>
<name type="personal">
<namePart type="given">Philippe</namePart>
<namePart type="family">Blache</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Noël</namePart>
<namePart type="family">Nguyen</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Nouredine</namePart>
<namePart type="family">Chenfour</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Abdenbi</namePart>
<namePart type="family">Rajouani</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>ATALA</publisher>
<place>
<placeTerm type="text">Fès, Maroc</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>Named entities and more generally Multiword Lexical Units (MWUs) are important for various applications. However, language independent methods for automatically extracting MWUs do not provide us with clean data. So, in this paper we propose a method for selecting possible named entities from automatically extracted MWUs, and later, a statistics-based language independent unsupervised approach is applied to possible named entities in order to cluster them according to their type. Statistical features used by our clustering process are described and motivated. The Model-Based Clustering Analysis (MBCA) software enabled us to obtain different clusters for proposed named entities. The method was applied to Bulgarian and English. For some clusters, precision is very high; other clusters still need further refinement. Based on the obtained clusters, it is also possible to classify new possible named entities.</abstract>
<identifier type="citekey">silva-etal-2004-extracting</identifier>
<location>
<url>https://aclanthology.org/2004.jeptalnrecital-poster.21/</url>
</location>
<part>
<date>2004-04</date>
<extent unit="page">
<start>125</start>
<end>130</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Extracting Named Entities. A Statistical Approach
%A Silva, Joaquim
%A Kozareva, Zornitsa
%A Noncheva, Veska
%A Lopes, Gabriel
%Y Blache, Philippe
%Y Nguyen, Noël
%Y Chenfour, Nouredine
%Y Rajouani, Abdenbi
%S Actes de la 11ème conférence sur le Traitement Automatique des Langues Naturelles. Posters
%D 2004
%8 April
%I ATALA
%C Fès, Maroc
%F silva-etal-2004-extracting
%X Named entities and more generally Multiword Lexical Units (MWUs) are important for various applications. However, language independent methods for automatically extracting MWUs do not provide us with clean data. So, in this paper we propose a method for selecting possible named entities from automatically extracted MWUs, and later, a statistics-based language independent unsupervised approach is applied to possible named entities in order to cluster them according to their type. Statistical features used by our clustering process are described and motivated. The Model-Based Clustering Analysis (MBCA) software enabled us to obtain different clusters for proposed named entities. The method was applied to Bulgarian and English. For some clusters, precision is very high; other clusters still need further refinement. Based on the obtained clusters, it is also possible to classify new possible named entities.
%U https://aclanthology.org/2004.jeptalnrecital-poster.21/
%P 125-130
Markdown (Informal)
[Extracting Named Entities. A Statistical Approach](https://aclanthology.org/2004.jeptalnrecital-poster.21/) (Silva et al., JEP/TALN/RECITAL 2004)
ACL
- Joaquim Silva, Zornitsa Kozareva, Veska Noncheva, and Gabriel Lopes. 2004. Extracting Named Entities. A Statistical Approach. In Actes de la 11ème conférence sur le Traitement Automatique des Langues Naturelles. Posters, pages 125–130, Fès, Maroc. ATALA.