Extracted from the IMDA dataset, https://www.imda.gov.sg/
Total size: 181 MB, 3,312,135 sentences, https://f000.backblazeb2.com/file/malay-dataset/dumping/imda/singlish-text.json
@misc{Malay-Dataset,
  author       = {Husein, Zolkepli},
  title        = {Malay-Dataset},
  year         = {2018},
  publisher    = {GitHub},
  journal      = {GitHub repository},
  howpublished = {\url{https://github.com/huseinzol05/malay-dataset/tree/master/dumping/singlish-text}},
  note         = {We gather Bahasa Malaysia corpus! Singlish Texts},
}