2025

Infant Cry Detection Using Causal Temporal Representation
Minghao Fu, Danning Li, Aryan Gadhiya, Benjamin Lambright, Mohamed Alowais, Mohab Bahnassy, Saad El Dine Elletter, Hawau Olamide Toyin, Haiyan Jiang, Kun Zhang, Hanan Aldarmaki
ICASSP, 2025
PDF   Code   BibTeX @inproceedings{fu2025infant,
  author       = {Fu, Minghao and Li, Danning and Gadhiya, Aryan and Lambright, Benjamin and Alowais, Mohamed and Bahnassy, Mohab and Elletter, Saad El Dine and Toyin, Hawau Olamide and Jiang, Haiyan and Zhang, Kun and Aldarmaki, Hanan},
  title        = {Infant Cry Detection Using Causal Temporal Representation},
  booktitle    = {ICASSP 2025-2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)},
  organization = {IEEE},
  pages        = {1--5},
  year         = {2025}
}

2024

PolyWER: A Holistic Evaluation Framework for Code-Switched Speech Recognition
Karima Kadaoui, Maryam Al Ali, Hawau Olamide Toyin, Ibrahim Mohammed, Hanan Aldarmaki
Findings of EMNLP, 2024
PDF   Code   HF Dataset   BibTeX @inproceedings{kadaoui-etal-2024-polywer,
  author    = {Kadaoui, Karima and Al Ali, Maryam and Toyin, Hawau Olamide and Mohammed, Ibrahim and Aldarmaki, Hanan},
  title     = {{PolyWER}: A Holistic Evaluation Framework for Code-Switched Speech Recognition},
  booktitle = {Findings of the Association for Computational Linguistics: EMNLP 2024},
  pages     = {6144--6153},
  year      = {2024},
  doi       = {10.18653/v1/2024.findings-emnlp.356}
}

STTATTS: Unified Speech-To-Text And Text-To-Speech Model
Hawau Olamide Toyin, Hao Li, Hanan Aldarmaki
Findings of EMNLP, 2024
PDF  Code   BibTeX @inproceedings{toyin-etal-2024-sttatts,
  author    = {Toyin, Hawau Olamide and Li, Hao and Aldarmaki, Hanan},
  title     = {{STTATTS}: Unified Speech-To-Text And Text-To-Speech Model},
  booktitle = {Findings of the Association for Computational Linguistics: EMNLP 2024},
  pages     = {6853--6863},
  year      = {2024},
  doi       = {10.18653/v1/2024.findings-emnlp.401}
}

Towards Automated Game-Based Early Screening for Language Disorder
Hamdan Hamid Al-Ali, Elsa Soares, Goncalo Leal, Rita Valente, Nicole Agrela, Alexandra Marquis, Hanan Aldarmaki
CLASP Conference on Multimodality and Interaction in Language Learning, 2024
PDF   BibTeX @inproceedings{al-ali-etal-2024-towards,
  author    = {Al-Ali, Hamdan Hamid and Soares, Elsa and Leal, Goncalo and Valente, Rita and Agrela, Nicole and Marquis, Alexandra and Aldarmaki, Hanan},
  title     = {Towards Automated Game-Based Early Screening for Language Disorder},
  booktitle = {Proceedings of the 2024 CLASP Conference on Multimodality and Interaction in Language Learning},
  publisher = {Association for Computational Linguistics},
  address   = {Gothenburg, Sweden},
  pages     = {26--31},
  year      = {2024}
}

PALM: Few-Shot Prompt Learning for Audio Language Models
Asif Hanif, Maha Tufail Agro, Mohammad Areeb Qazi, Hanan Aldarmaki
EMNLP, 2024
PDF   Code   BibTeX @inproceedings{hanif2024palm,
  author    = {Hanif, Asif and Agro, Maha and Qazi, Mohammad and Aldarmaki, Hanan},
  title     = {{PALM}: Few-Shot Prompt Learning for Audio Language Models},
  booktitle = {Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing},
  pages     = {18527--18536},
  year      = {2024}
}

Spoken Word2Vec: Learning Skipgram Embeddings from Speech
Mohammad Amaan Sayeed, Hanan Aldarmaki
Interspeech, 2024
PDF   Code   BibTeX @inproceedings{sayeed24_interspeech,
  author    = {Sayeed, Mohammad Amaan and Aldarmaki, Hanan},
  title     = {Spoken {Word2Vec}: Learning Skipgram Embeddings from Speech},
  booktitle = {Interspeech 2024},
  pages     = {2920--2924},
  year      = {2024},
  doi       = {10.21437/Interspeech.2024-2181},
  issn      = {2958-1796}
}

Data Augmentation for Speech-Based Diacritic Restoration
Sara Shatnawi, Sawsan Alqahtani, Shady Shehata, Hanan Aldarmaki
ArabicNLP, 2024
PDF   Code   BibTeX @inproceedings{shatnawi-etal-2024-data,
  author    = {Shatnawi, Sara and Alqahtani, Sawsan and Shehata, Shady and Aldarmaki, Hanan},
  title     = {Data Augmentation for Speech-Based Diacritic Restoration},
  booktitle = {Proceedings of The Second Arabic Natural Language Processing Conference},
  pages     = {160--169},
  year      = {2024},
  doi       = {10.18653/v1/2024.arabicnlp-1.15}
}

Automatic Restoration of Diacritics for Speech Data Sets
Sara Shatnawi, Sawsan Alqahtani, Hanan Aldarmaki
NAACL, 2024
PDF   Code   BibTeX @inproceedings{shatnawi-etal-2024-automatic,
  author    = {Shatnawi, Sara and Alqahtani, Sawsan and Aldarmaki, Hanan},
  title     = {Automatic Restoration of Diacritics for Speech Data Sets},
  booktitle = {Proceedings of the 2024 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies (Volume 1: Long Papers)},
  year      = {2024},
  doi       = {10.18653/v1/2024.naacl-long.233}
}

Mixat: A Data Set of Bilingual Emirati-English Speech
Maryam Khalifa Al Ali, Hanan Aldarmaki
SIGUL @ LREC-COLING, 2024
PDF   Source  HF Dataset   BibTeX @inproceedings{al-ali-aldarmaki-2024-mixat,
  author    = {Al Ali, Maryam Khalifa and Aldarmaki, Hanan},
  title     = {{Mixat}: A Data Set of Bilingual {Emirati-English} Speech},
  booktitle = {Proceedings of the 3rd Annual Meeting of the Special Interest Group on Under-resourced Languages @ LREC-COLING 2024},
  pages     = {222--226},
  year      = {2024}
}

2023

ArTST: Arabic Text and Speech Transformer
Hawau Olamide Toyin, Amirbek Djanibekov, Ajinkya Kulkarni, Hanan Aldarmaki
ArabicNLP, 2023
PDF   Code   HF Model   BibTeX @inproceedings{toyin2023artst,
  author    = {Toyin, Hawau Olamide and Djanibekov, Amirbek and Kulkarni, Ajinkya and Aldarmaki, Hanan},
  title     = {{ArTST}: {Arabic} Text and Speech Transformer},
  booktitle = {Proceedings of ArabicNLP 2023},
  pages     = {41--51},
  year      = {2023},
  doi       = {10.18653/v1/2023.arabicnlp-1.5}
}

Yet Another Model for Arabic Dialect Identification
Ajinkya Kulkarni, Hanan Aldarmaki
ArabicNLP, 2023
PDF   BibTeX @inproceedings{kulkarni2023yet,
  author    = {Kulkarni, Ajinkya and Aldarmaki, Hanan},
  title     = {Yet Another Model for {Arabic} Dialect Identification},
  booktitle = {Proceedings of ArabicNLP 2023},
  pages     = {435--440},
  year      = {2023}
}

Handling Realistic Label Noise in BERT Text Classification
Maha Agro, Hanan Aldarmaki
ICNLSP, 2023
PDF   BibTeX @inproceedings{agro2023handling,
  author    = {Agro, Maha and Aldarmaki, Hanan},
  title     = {Handling Realistic Label Noise in {BERT} Text Classification},
  booktitle = {Proceedings of the 6th International Conference on Natural Language and Speech Processing (ICNLSP 2023)},
  pages     = {11--20},
  year      = {2023}
}

Diacritic Recognition Performance in Arabic ASR
Hanan Aldarmaki, Ahmad Ghannam
Interspeech, 2023
PDF   BibTeX @inproceedings{aldarmaki2023diacritic,
  author    = {Aldarmaki, Hanan and Ghannam, Ahmad},
  title     = {Diacritic Recognition Performance in {Arabic} {ASR}},
  booktitle = {Proc. Interspeech 2023},
  pages     = {361--365},
  year      = {2023}
}

ClArTTS: An Open-Source Classical Arabic Text-to-Speech Corpus
Ajinkya Kulkarni, Atharva Kulkarni, Sara Abedalmon'em Mohammad Shatnawi, Hanan Aldarmaki
Interspeech, 2023
PDF   HF Dataset   BibTeX @inproceedings{kulkarni2023clartts,
  author    = {Kulkarni, Ajinkya and Kulkarni, Atharva and Shatnawi, Sara Abedalmon'em Mohammad and Aldarmaki, Hanan},
  title     = {{ClArTTS}: An Open-Source Classical {Arabic} Text-to-Speech Corpus},
  booktitle = {Proc. Interspeech 2023},
  pages     = {5511--5515},
  year      = {2023},
  doi       = {10.21437/Interspeech.2023-2224}
}

Earlier

Supervised Acoustic Embeddings And Their Transferability Across Languages
Sreepratha Ram, Hanan Aldarmaki
ICNLSP, 2022
PDF   Code   BibTeX @inproceedings{ram2022supervised,
  author    = {Ram, Sreepratha and Aldarmaki, Hanan},
  title     = {Supervised Acoustic Embeddings And Their Transferability Across Languages},
  booktitle = {Proceedings of the 5th International Conference on Natural Language and Speech Processing (ICNLSP 2022)},
  pages     = {212--218},
  year      = {2022}
}

Unsupervised Automatic Speech Recognition: A Review
Hanan Aldarmaki, Asad Ullah, Sreepratha Ram, Nazar Zaki
Speech Communication, 2022
PDF   HTML BibTeX @article{ALDARMAKI202276,
  author  = {Aldarmaki, Hanan and Ullah, Asad and Ram, Sreepratha and Zaki, Nazar},
  title   = {Unsupervised Automatic Speech Recognition: A Review},
  journal = {Speech Communication},
  volume  = {139},
  pages   = {76--91},
  year    = {2022},
  issn    = {0167-6393},
  doi     = {10.1016/j.specom.2022.02.005},
  url     = {https://www.sciencedirect.com/science/article/pii/S0167639322000292}
}

Homograph Disambiguation through Selective Diacritic Restoration
Sawsan Alqahtani, Hanan Aldarmaki, Mona Diab
Arabic NLP, 2019
PDF   BibTeX @inproceedings{alqahtani2019homograph,
  author    = {Alqahtani, Sawsan and Aldarmaki, Hanan and Diab, Mona},
  title     = {Homograph Disambiguation through Selective Diacritic Restoration},
  booktitle = {Proceedings of the Fourth Arabic Natural Language Processing Workshop},
  pages     = {49--59},
  year      = {2019}
}

Efficient Sentence Embedding using Discrete Cosine Transform
Nada Almarwani, Hanan Aldarmaki, Mona Diab
EMNLP, 2019
PDF   Code   BibTeX @inproceedings{almarwani2019efficient,
  author    = {Almarwani, Nada and Aldarmaki, Hanan and Diab, Mona},
  title     = {Efficient Sentence Embedding using Discrete Cosine Transform},
  booktitle = {Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Joint Conference on Natural Language Processing (EMNLP-IJCNLP)},
  pages     = {3672--3678},
  year      = {2019}
}

Scalable Cross-Lingual Transfer of Neural Sentence Embeddings
Hanan Aldarmaki, Mona Diab
*SEM, 2019
PDF   BibTeX @inproceedings{aldarmaki2019scalable,
  author    = {Aldarmaki, Hanan and Diab, Mona},
  title     = {Scalable Cross-Lingual Transfer of Neural Sentence Embeddings},
  booktitle = {Proceedings of the Eighth Joint Conference on Lexical and Computational Semantics (*SEM 2019)},
  pages     = {51--60},
  year      = {2019}
}

Context-Aware Cross-Lingual Mapping
Hanan Aldarmaki, Mona Diab
NAACL, 2019
PDF   Code   BibTeX @inproceedings{aldarmaki2019context,
  author    = {Aldarmaki, Hanan and Diab, Mona},
  title     = {Context-Aware Cross-Lingual Mapping},
  booktitle = {Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long and Short Papers)},
  pages     = {3906--3911},
  year      = {2019}
}

Evaluation of Unsupervised Compositional Representations
Hanan Aldarmaki, Mona Diab
COLING, 2018
PDF   Code   BibTeX @inproceedings{aldarmaki2018evaluation,
  author    = {Aldarmaki, Hanan and Diab, Mona},
  title     = {Evaluation of Unsupervised Compositional Representations},
  booktitle = {Proceedings of the 27th International Conference on Computational Linguistics},
  pages     = {2666--2677},
  year      = {2018}
}

Unsupervised Word Mapping Using Structural Similarities in Monolingual Embeddings
Hanan Aldarmaki, Mahesh Mohan, Mona Diab
TACL, 2018
PDF   Code   BibTeX @article{aldarmaki2018unsupervised,
  author  = {Aldarmaki, Hanan and Mohan, Mahesh and Diab, Mona},
  title   = {Unsupervised Word Mapping Using Structural Similarities in Monolingual Embeddings},
  journal = {Transactions of the Association for Computational Linguistics},
  volume  = {6},
  pages   = {185--196},
  year    = {2018}
}

Learning Cross-lingual Representations with Matrix Factorization
Hanan Aldarmaki, Mona Diab
Workshop on Multilingual and Cross-lingual Methods in NLP, 2016
PDF   Code   BibTeX @inproceedings{aldarmaki2016learning,
  author    = {Aldarmaki, Hanan and Diab, Mona},
  title     = {Learning Cross-lingual Representations with Matrix Factorization},
  booktitle = {Proceedings of the Workshop on Multilingual and Cross-lingual Methods in NLP},
  pages     = {1--9},
  year      = {2016}
}

Robust Part-of-Speech Tagging of Arabic Text
Hanan Aldarmaki, Mona Diab
Arabic NLP, 2015
PDF BibTeX @inproceedings{aldarmaki2015robust,
  author    = {Aldarmaki, Hanan and Diab, Mona},
  title     = {Robust Part-of-Speech Tagging of {Arabic} Text},
  booktitle = {Proceedings of the Second Workshop on Arabic Natural Language Processing},
  pages     = {173--182},
  year      = {2015}
}