2025
Chowdhury, Sinthia; Remal, Deawan Rakin Ahamed; Pasha, Syed Tangim; Islam, Ashraful; Noori, Sheak Rashed Haider
ChatgaiyyaAlap: A dataset for conversion from Chittagonian dialect to standard Bangla (Journal Article)
In: Data in Brief, vol. 59, pp. 111413, 2025, ISSN: 2352-3409.
Abstract | Links | BibTeX | Tags: Bangladesh, Bengali language, Dialect, Natural language processing
@comment{
  Journal article: the ChatgaiyyaAlap dataset paper, Data in Brief vol. 59 (2025).
  - doi holds the bare DOI; citation styles add the resolver prefix themselves.
  - Braced words in the title keep their capitalisation under sentence-casing styles.
  - pubstate and tppubtype are non-standard fields kept unchanged; presumably
    consumed by the tool that exported this record (not confirmed from this file).
}
@article{CHOWDHURY2025111413,
  author     = {Chowdhury, Sinthia and Remal, Deawan Rakin Ahamed and Pasha, Syed Tangim and Islam, Ashraful and Noori, Sheak Rashed Haider},
  title      = {{ChatgaiyyaAlap}: A dataset for conversion from {Chittagonian} dialect to standard {Bangla}},
  journal    = {Data in Brief},
  volume     = {59},
  pages      = {111413},
  year       = {2025},
  date       = {2025-01-01},
  issn       = {2352-3409},
  doi        = {10.1016/j.dib.2025.111413},
  url        = {https://www.sciencedirect.com/science/article/pii/S2352340925001453},
  keywords   = {Bangladesh, Bengali language, Dialect, Natural language processing},
  abstract   = {Bangla is one of the most used languages around the world with 240 million speakers. The standard Bangla language is the official language of people from Bangladesh and a few other parts outside Bangladesh, like West Bengal and Tripura. Although, people from different areas of Bangladesh do not use standard Bangla on a day-to-day basis. Instead, dialects of the Bangla language are used. The dialects of the Bangla language are quite diverse which includes the Rajshahi dialect, Sylheti dialect, Old Dhaka dialect, Chittagonian dialect, and many more. Nearly every division of Bangladesh has its unique dialect which adds linguistic diversity to the language. The main difference between the standard Bangla language and Chittagonian dialect is that it does not have any written form and the words vary from the standard Bangla. We built a dataset containing standard Bangla and one of its most used dialects: the Chittagonian dialect. Our dataset, ``ChatgaiyyaAlap,'' was created by combining 4012 unique sentences in standard Bangla with their Chittagonian translations, which were gathered from dramas, comments, and videos on YouTube and Facebook. In our dataset, we cleaned the data by removing emojis, punctuations, and unessential spaces. The dissimilarity in spelling as well as in sentence structure between standard Bangla and Chittagonian dialects, particularly in negative sentences can be clearly visible through this dataset. Additionally, to maintain the data accuracy, we developed a dictionary containing 1,500 standard Bangla words and their Chittagonian form. The dictionary showcases significant variation in the vocabulary of both languages and resolves ambiguities along with potential biases. To perform a word-to-word translation this dictionary would be useful, while for studying comparative linguistics and developing intelligent systems the ChatgaiyyaAlap dataset might assist the researchers. Moreover, this dataset can be utilized to train language models for linguistic translation.},
  pubstate   = {published},
  tppubtype  = {article}
}
Sultana, Zinnat; Akter, Miss. Rokeya; Rahman, Tanveer Ehsanur; Ferdous, Hasan Shahid; Wulandari, Teresa; Amin, M Ashraful; Ahmed, Syed Ishtiaque; Sultana, Sharifa
Internet Disconnection as a Risk to Cross-Border Human Rights (Proceedings Article)
In: Proceedings of the Extended Abstracts of the CHI Conference on Human Factors in Computing Systems, Association for Computing Machinery, New York, NY, USA, 2025, ISBN: 9798400713958.
Abstract | Links | BibTeX | Tags: Bangladesh, Cross-border, Ethics, Human Rights, ICTD, Immigrants, July Uprising, Justice
@comment{
  Conference paper in the CHI 2025 Extended Abstracts (series CHI EA '25),
  published by the Association for Computing Machinery.
  Fields are grouped as: who/what, where published, when, identifiers, descriptive metadata.
  pubstate and tppubtype are non-standard fields kept unchanged; presumably
  consumed by the tool that exported this record (not confirmed from this file).
}
@inproceedings{10.1145/3706599.3720245,
  author     = {Zinnat Sultana and Miss. Rokeya Akter and Tanveer Ehsanur Rahman and Hasan Shahid Ferdous and Teresa Wulandari and M Ashraful Amin and Syed Ishtiaque Ahmed and Sharifa Sultana},
  title      = {Internet Disconnection as a Risk to Cross-Border Human Rights},
  booktitle  = {Proceedings of the Extended Abstracts of the CHI Conference on Human Factors in Computing Systems},
  series     = {CHI EA '25},
  publisher  = {Association for Computing Machinery},
  address    = {New York, NY, USA},
  year       = {2025},
  date       = {2025-01-01},
  isbn       = {9798400713958},
  doi        = {10.1145/3706599.3720245},
  url        = {https://doi.org/10.1145/3706599.3720245},
  keywords   = {Bangladesh, Cross-border, Ethics, Human Rights, ICTD, Immigrants, July Uprising, Justice},
  abstract   = {One of the biggest movements organized by Gen-Z is the July-August 2024 quota reformation movement in Bangladesh. During this movement, the government in power of Bangladesh shut down the internet nationwide for ten consecutive days to suppress the voices of people and disconnect them from the rest of the world. Our ongoing project investigates the movement and analyzes this crisis. We are currently conducting interviews with Bangladeshi people living outside of Bangladesh to understand the trouble they faced due to the internet shutdown and found that their human rights were violated in multiple ways. The participants informed us about how propaganda spread, which was impossible to verify due to the internet shutdown, resulting in more chaos and confusion during that time and possibly leading to more damage to the nation and its resources. We present the findings and discuss possible directions for HCI.},
  pubstate   = {published},
  tppubtype  = {inproceedings}
}

