🎉 🎉 🎉 The Amharic Hate Speech Dataset has been uploaded to Hugging Face: Amharic Hate Speech Dataset 🎉 🎉 🎉
🎉 🎉 🎉 The Amharic Hate Speech Classification Model has been uploaded to Hugging Face: Amharic Hate Speech Model 🎉 🎉 🎉
On this page, we introduce four datasets, along with classification models, for Amharic hate speech detection:
- Dataset: RANLP-2023
- Dataset: ICT4DA-2022
- Dataset: TRAC-LREC-COLING-2024 Hate Targets and Intensity
- Dataset: TRAC-LREC-COLING-2024 HateMem
The code for HateMem is available here.
Please read our papers for the details:
Detecting Hate Speech in Amharic Using Multimodal Analysis of Social Media Memes
@inproceedings{melese2024,
  author    = {Jigar, Melese Ayichlie and Ayele, Abinew Ali and Yimam, Seid Muhie and Biemann, Chris},
  title     = {Detecting Hate Speech in {Amharic} Using Multimodal Analysis of Social Media Memes},
  booktitle = {Proceedings of the Fourth Workshop on Threat, Aggression \& Cyberbullying},
  year      = {2024},
  address   = {Torino, Italy},
}
Exploring Boundaries and Intensities in Offensive and Hate Speech: Unveiling the Complex Spectrum of Social Media Discourse
@inproceedings{ayele-exploring2024,
  author    = {Ayele, Abinew Ali and Jalew, Esubalew Alemneh and Ali, Adem Chanie and Yimam, Seid Muhie and Biemann, Chris},
  title     = {Exploring Boundaries and Intensities in Offensive and Hate Speech: Unveiling the Complex Spectrum of Social Media Discourse},
  booktitle = {Proceedings of the Fourth Workshop on Threat, Aggression \& Cyberbullying},
  year      = {2024},
  address   = {Torino, Italy},
}
Exploring Amharic Hate Speech Data Collection and Classification Approaches
@inproceedings{ayelexplorhate2023,
  author    = {Ayele, Abinew Ali and Yimam, Seid Muhie and Belay, Tadesse Destaw and Asfaw, Tesfa and Biemann, Chris},
  title     = {Exploring {Amharic} Hate Speech Data Collection and Classification Approaches},
  booktitle = {Proceedings of the 14th International Conference on Recent Advances in Natural Language Processing ({RANLP} 2023)},
  pages     = {49--59},
  year      = {2023},
  address   = {Varna, Bulgaria},
}
The 5Js in Ethiopia: Amharic Hate Speech Data Annotation Using Toloka Crowdsourcing Platform
@inproceedings{ayele20225js,
  author    = {Ayele, Abinew Ali and Dinter, Skadi and Belay, Tadesse Destaw and Asfaw, Tesfa Tegegne and Yimam, Seid Muhie and Biemann, Chris},
  title     = {The {5Js} in {Ethiopia}: {Amharic} Hate Speech Data Annotation Using {Toloka} Crowdsourcing Platform},
  booktitle = {2022 International Conference on Information and Communication Technology for Development for Africa ({ICT4DA})},
  pages     = {114--120},
  year      = {2022},
  address   = {Bahir Dar, Ethiopia},
  url       = {https://ieeexplore.ieee.org/document/9971189},
}
Challenges of Amharic Hate Speech Data Annotation Using Yandex Toloka Crowdsourcing Platform
@inproceedings{ayelechallenges,
  author    = {Ayele, Abinew Ali and Belay, Tadesse Destaw and Yimam, Seid Muhie and Dinter, Skadi and Asfaw, Tesfa Tegegne and Biemann, Chris},
  title     = {Challenges of {Amharic} Hate Speech Data Annotation Using {Yandex} {Toloka} Crowdsourcing Platform},
  booktitle = {Proceedings of the Sixth Widening {NLP} Workshop ({WiNLP}) co-located with {EMNLP} 2022},
  year      = {2022},
  address   = {Abu Dhabi, United Arab Emirates},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2022.winlp-1.0},
}