@inproceedings{abeywardana-thayasivam-2020-privacy,
title = "A Privacy Preserving Data Publishing Middleware for Unstructured, Textual Social Media Data",
author = "Abeywardana, Prasadi and
Thayasivam, Uthayasanker",
editor = "Bhatia, Archna and
Shaikh, Samira",
booktitle = "Proceedings for the First International Workshop on Social Threats in Online Conversations: Understanding and Management",
month = may,
year = "2020",
address = "Marseille, France",
publisher = "European Language Resources Association",
url = "https://aclanthology.org/2020.stoc-1.4",
pages = "21--28",
abstract = "Privacy is going to be an integral part of data science and analytics in the coming years. The next hype of data experimentation is going to be heavily dependent on privacy preserving techniques mainly as it{'}s going to be a legal responsibility rather than a mere social responsibility. Privacy preservation becomes more challenging specially in the context of unstructured data. Social networks have become predominantly popular over the past couple of decades and they are creating a huge data lake at a high velocity. Social media profiles contain a wealth of personal and sensitive information, creating enormous opportunities for third parties to analyze them with different algorithms, draw conclusions and use in disinformation campaigns and micro targeting based dark advertising. This study provides a mitigation mechanism for disinformation campaigns that are done based on the insights extracted from personal/sensitive data analysis. Specifically, this research is aimed at building a privacy preserving data publishing middleware for unstructured social media data without compromising the true analytical value of those data. A novel way is proposed to apply traditional structured privacy preserving techniques on unstructured data. Creating a comprehensive twitter corpus annotated with privacy attributes is another objective of this research, especially because the research community is lacking one.",
language = "English",
ISBN = "979-10-95546-39-9",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="abeywardana-thayasivam-2020-privacy">
<titleInfo>
<title>A Privacy Preserving Data Publishing Middleware for Unstructured, Textual Social Media Data</title>
</titleInfo>
<name type="personal">
<namePart type="given">Prasadi</namePart>
<namePart type="family">Abeywardana</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Uthayasanker</namePart>
<namePart type="family">Thayasivam</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2020-05</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<language>
<languageTerm type="text">English</languageTerm>
<languageTerm type="code" authority="iso639-2b">eng</languageTerm>
</language>
<relatedItem type="host">
<titleInfo>
<title>Proceedings for the First International Workshop on Social Threats in Online Conversations: Understanding and Management</title>
</titleInfo>
<name type="personal">
<namePart type="given">Archna</namePart>
<namePart type="family">Bhatia</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Samira</namePart>
<namePart type="family">Shaikh</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>European Language Resources Association</publisher>
<place>
<placeTerm type="text">Marseille, France</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
<identifier type="isbn">979-10-95546-39-9</identifier>
</relatedItem>
<abstract>Privacy is going to be an integral part of data science and analytics in the coming years. The next hype of data experimentation is going to be heavily dependent on privacy preserving techniques mainly as it’s going to be a legal responsibility rather than a mere social responsibility. Privacy preservation becomes more challenging specially in the context of unstructured data. Social networks have become predominantly popular over the past couple of decades and they are creating a huge data lake at a high velocity. Social media profiles contain a wealth of personal and sensitive information, creating enormous opportunities for third parties to analyze them with different algorithms, draw conclusions and use in disinformation campaigns and micro targeting based dark advertising. This study provides a mitigation mechanism for disinformation campaigns that are done based on the insights extracted from personal/sensitive data analysis. Specifically, this research is aimed at building a privacy preserving data publishing middleware for unstructured social media data without compromising the true analytical value of those data. A novel way is proposed to apply traditional structured privacy preserving techniques on unstructured data. Creating a comprehensive twitter corpus annotated with privacy attributes is another objective of this research, especially because the research community is lacking one.</abstract>
<identifier type="citekey">abeywardana-thayasivam-2020-privacy</identifier>
<location>
<url>https://aclanthology.org/2020.stoc-1.4</url>
</location>
<part>
<date>2020-05</date>
<extent unit="page">
<start>21</start>
<end>28</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T A Privacy Preserving Data Publishing Middleware for Unstructured, Textual Social Media Data
%A Abeywardana, Prasadi
%A Thayasivam, Uthayasanker
%Y Bhatia, Archna
%Y Shaikh, Samira
%S Proceedings for the First International Workshop on Social Threats in Online Conversations: Understanding and Management
%D 2020
%8 May
%I European Language Resources Association
%C Marseille, France
%@ 979-10-95546-39-9
%G English
%F abeywardana-thayasivam-2020-privacy
%X Privacy is going to be an integral part of data science and analytics in the coming years. The next hype of data experimentation is going to be heavily dependent on privacy preserving techniques mainly as it’s going to be a legal responsibility rather than a mere social responsibility. Privacy preservation becomes more challenging specially in the context of unstructured data. Social networks have become predominantly popular over the past couple of decades and they are creating a huge data lake at a high velocity. Social media profiles contain a wealth of personal and sensitive information, creating enormous opportunities for third parties to analyze them with different algorithms, draw conclusions and use in disinformation campaigns and micro targeting based dark advertising. This study provides a mitigation mechanism for disinformation campaigns that are done based on the insights extracted from personal/sensitive data analysis. Specifically, this research is aimed at building a privacy preserving data publishing middleware for unstructured social media data without compromising the true analytical value of those data. A novel way is proposed to apply traditional structured privacy preserving techniques on unstructured data. Creating a comprehensive twitter corpus annotated with privacy attributes is another objective of this research, especially because the research community is lacking one.
%U https://aclanthology.org/2020.stoc-1.4
%P 21-28
Markdown (Informal)
[A Privacy Preserving Data Publishing Middleware for Unstructured, Textual Social Media Data](https://aclanthology.org/2020.stoc-1.4) (Abeywardana & Thayasivam, STOC 2020)
ACL