Augmented MS-EN dataset, generated using augment-ms-en.ipynb:
- https://huggingface.co/datasets/mesolitica/noisy-ms-en-augmentation/resolve/main/augmented-ms-en-1.json
- https://huggingface.co/datasets/mesolitica/noisy-ms-en-augmentation/resolve/main/augmented-ms-en-2.json
- https://huggingface.co/datasets/mesolitica/noisy-ms-en-augmentation/resolve/main/augmented-ms-en-3.json
- https://huggingface.co/datasets/mesolitica/noisy-ms-en-augmentation/resolve/main/augmented-ms-en-v2.json
- https://huggingface.co/datasets/mesolitica/noisy-ms-en-augmentation/resolve/main/augmented-ms-en-v3.json
- https://huggingface.co/datasets/mesolitica/noisy-ms-en-augmentation/resolve/main/augmented-ms-en-test.json
@misc{Malay-Dataset,
note = {We gather Bahasa Malaysia corpus!, Noisy MS-EN Augmentation},
author = {Husein, Zolkepli},
title = {Malay-Dataset},
year = {2018},
publisher = {GitHub},
journal = {GitHub repository},
howpublished = {\url{https://github.com/huseinzol05/malay-dataset/tree/master/translation/noisy-ms-en-augmentation}}
}