Skip to content

uhh-lt/AmharicHateSpeech

Folders and files

NameName
Last commit message
Last commit date

Latest commit

 
 
 
 
 
 
 
 
 
 
 
 
 

Repository files navigation


🎉 🎉 🎉 The Amharic Hate Speech Dataset is now available on Hugging Face: Amharic Hate Speech 🎉 🎉 🎉


Data

On this page, we introduce four datasets for building Amharic hate speech detection and classification models:


  1. Dataset: RANLP-2023
  2. Dataset: ICT4DA-2022
  3. Dataset: TRAC-LREC-COLING-2024 Hate Targets and Intensity
  4. Dataset: TRAC-LREC-COLING-2024 HateMem

Code

The code for HateMem is available here.

Please refer to our papers for details:

Detecting Hate Speech in Amharic Using Multimodal Analysis of Social Media Memes

@inproceedings{melese2024,
  author    = {Jigar, Melese Ayichlie and Ayele, Abinew Ali and Yimam, Seid Muhie and Biemann, Chris},
  title     = {Detecting Hate Speech in {Amharic} Using Multimodal Analysis of Social Media Memes},
  booktitle = {Proceedings of the Fourth Workshop on Threat, Aggression \& Cyberbullying},
  year      = {2024},
  address   = {Torino, Italy},
}

Exploring Boundaries and Intensities in Offensive and Hate Speech: Unveiling the Complex Spectrum of Social Media Discourse

@inproceedings{ayele-exploring2024,
  author    = {Ayele, Abinew Ali and Jalew, Esubalew Alemneh and Ali, Adem Chanie and Yimam, Seid Muhie and Biemann, Chris},
  title     = {Exploring Boundaries and Intensities in Offensive and Hate Speech: Unveiling the Complex Spectrum of Social Media Discourse},
  booktitle = {Proceedings of the Fourth Workshop on Threat, Aggression \& Cyberbullying},
  year      = {2024},
  address   = {Torino, Italy},
}

Exploring Amharic Hate Speech Data Collection and Classification Approaches

@inproceedings{ayelexplorhate2023,
  author    = {Ayele, Abinew Ali and Yimam, Seid Muhie and Belay, Tadesse Destaw and Asfaw, Tesfa and Biemann, Chris},
  title     = {Exploring {Amharic} Hate Speech Data Collection and Classification Approaches},
  booktitle = {Proceedings of the 14th International Conference on Recent Advances in Natural Language Processing ({RANLP} 2023)},
  pages     = {49--59},
  year      = {2023},
  address   = {Varna, Bulgaria},
}

The 5Js in Ethiopia: Amharic Hate Speech Data Annotation Using Toloka Crowdsourcing Platform

@inproceedings{ayele20225js,
  author    = {Ayele, Abinew Ali and Dinter, Skadi and Belay, Tadesse Destaw and Asfaw, Tesfa Tegegne and Yimam, Seid Muhie and Biemann, Chris},
  title     = {The {5Js} in {Ethiopia}: {Amharic} Hate Speech Data Annotation Using {Toloka} Crowdsourcing Platform},
  booktitle = {2022 International Conference on Information and Communication Technology for Development for Africa ({ICT4DA})},
  pages     = {114--120},
  year      = {2022},
  address   = {Bahir Dar, Ethiopia},
  url       = {https://ieeexplore.ieee.org/document/9971189},
}

Challenges of Amharic Hate Speech Data Annotation Using Yandex Toloka Crowdsourcing Platform

@inproceedings{ayelechallenges,
  author    = {Ayele, Abinew Ali and Belay, Tadesse Destaw and Yimam, Seid Muhie and Dinter, Skadi and Asfaw, Tesfa Tegegne and Biemann, Chris},
  title     = {Challenges of {Amharic} Hate Speech Data Annotation Using {Yandex} {Toloka} Crowdsourcing Platform},
  booktitle = {Proceedings of the Sixth Widening {NLP} Workshop ({WiNLP}) co-located with {EMNLP} 2022},
  year      = {2022},
  address   = {Abu Dhabi, United Arab Emirates},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2022.winlp-1.0},
}

About

Amharic Hate Speech - Dataset and classification Models

Resources

Stars

Watchers

Forks

Releases

No releases published

Packages

No packages published