publications
Publications by category, in reverse chronological order. Generated by jekyll-scholar.
2024
- SEACrowd: A Multilingual Multimodal Data Hub and Benchmark Suite for Southeast Asian Languages. Holy Lovenia, Rahmad Mahendra, Salsabil Maulana Akbar, and 58 more authors. 2024.
% SEACrowd arXiv preprint (arXiv:2406.10118, primary class cs.CL).
% The coined name and the proper nouns in the title are brace-protected so that
% sentence-casing bibliography styles do not lowercase them.
@misc{lovenia2024seacrowdmultilingualmultimodaldata,
  author        = {Lovenia, Holy and Mahendra, Rahmad and Akbar, Salsabil Maulana and Miranda, Lester James V. and Santoso, Jennifer and Aco, Elyanah and Fadhilah, Akhdan and Mansurov, Jonibek and Imperial, Joseph Marvin and Kampman, Onno P. and Moniz, Joel Ruben Antony and Habibi, Muhammad Ravi Shulthan and Hudi, Frederikus and Montalan, Railey and Ignatius, Ryan and Lopo, Joanito Agili and Nixon, William and Karlsson, Börje F. and Jaya, James and Diandaru, Ryandito and Gao, Yuze and Amadeus, Patrick and Wang, Bin and Cruz, Jan Christian Blaise and Whitehouse, Chenxi and Parmonangan, Ivan Halim and Khelli, Maria and Zhang, Wenyu and Susanto, Lucky and Ryanda, Reynard Adha and Hermawan, Sonny Lazuardi and Velasco, Dan John and Kautsar, Muhammad Dehan Al and Hendria, Willy Fitra and Moslem, Yasmin and Flynn, Noah and Adilazuarda, Muhammad Farid and Li, Haochen and Lee, Johanes and Damanhuri, R. and Sun, Shuo and Qorib, Muhammad Reza and Djanibekov, Amirbek and Leong, Wei Qi and Do, Quyet V. and Muennighoff, Niklas and Pansuwan, Tanrada and Putra, Ilham Firdausi and Xu, Yan and Tai, Ngee Chia and Purwarianti, Ayu and Ruder, Sebastian and Tjhi, William and Limkonchotiwat, Peerat and Aji, Alham Fikri and Keh, Sedrick and Winata, Genta Indra and Zhang, Ruochen and Koto, Fajri and Yong, Zheng-Xin and Cahyawijaya, Samuel},
  title         = {{SEACrowd}: A Multilingual Multimodal Data Hub and Benchmark Suite for {Southeast} {Asian} Languages},
  year          = {2024},
  eprint        = {2406.10118},
  archiveprefix = {arXiv},
  primaryclass  = {cs.CL},
  url           = {https://arxiv.org/abs/2406.10118},
}
- CVQA: Culturally-diverse Multilingual Visual Question Answering Benchmark. David Romero, Chenyang Lyu, Haryo Akbarianto Wibowo, and 72 more authors. 2024.
% CVQA arXiv preprint (arXiv:2406.05967, primary class cs.CV).
% The acronym in the title is brace-protected so sentence-casing styles keep it upper-case.
% NOTE(review): "Le Meur, David" replaces "Meur, David Le" on the assumption that
% "Le Meur" is a compound surname -- confirm against the paper's author list.
@misc{romero2024cvqaculturallydiversemultilingualvisual,
  author        = {Romero, David and Lyu, Chenyang and Wibowo, Haryo Akbarianto and Lynn, Teresa and Hamed, Injy and Kishore, Aditya Nanda and Mandal, Aishik and Dragonetti, Alina and Abzaliev, Artem and Tonja, Atnafu Lambebo and Balcha, Bontu Fufa and Whitehouse, Chenxi and Salamea, Christian and Velasco, Dan John and Adelani, David Ifeoluwa and Le Meur, David and Villa-Cueva, Emilio and Koto, Fajri and Farooqui, Fauzan and Belcavello, Frederico and Batnasan, Ganzorig and Vallejo, Gisela and Caulfield, Grainne and Ivetta, Guido and Song, Haiyue and Ademtew, Henok Biadglign and Maina, Hernán and Lovenia, Holy and Azime, Israel Abebe and Cruz, Jan Christian Blaise and Gala, Jay and Geng, Jiahui and Ortiz-Barajas, Jesus-German and Baek, Jinheon and Dunstan, Jocelyn and Alemany, Laura Alonso and Nagasinghe, Kumaranage Ravindu Yasas and Benotti, Luciana and D'Haro, Luis Fernando and Viridiano, Marcelo and Estecha-Garitagoitia, Marcos and Cabrera, Maria Camila Buitrago and Rodríguez-Cantelar, Mario and Jouitteau, Mélanie and Mihaylov, Mihail and Imam, Mohamed Fazli Mohamed and Adilazuarda, Muhammad Farid and Gochoo, Munkhjargal and Otgonbold, Munkh-Erdene and Etori, Naome and Niyomugisha, Olivier and Silva, Paula Mónica and Chitale, Pranjal and Dabre, Raj and Chevi, Rendi and Zhang, Ruochen and Diandaru, Ryandito and Cahyawijaya, Samuel and Góngora, Santiago and Jeong, Soyeong and Purkayastha, Sukannya and Kuribayashi, Tatsuki and Jayakumar, Thanmay and Torrent, Tiago Timponi and Ehsan, Toqeer and Araujo, Vladimir and Kementchedjhieva, Yova and Burzo, Zara and Lim, Zheng Wei and Yong, Zheng Xin and Ignat, Oana and Nwatu, Joan and Mihalcea, Rada and Solorio, Thamar and Aji, Alham Fikri},
  title         = {{CVQA}: Culturally-diverse Multilingual Visual Question Answering Benchmark},
  year          = {2024},
  eprint        = {2406.05967},
  archiveprefix = {arXiv},
  primaryclass  = {cs.CV},
  url           = {https://arxiv.org/abs/2406.05967},
}
- Could We Have Had Better Multilingual LLMs if English Was Not the Central Language? Ryandito Diandaru, Lucky Susanto, Zilu Tang, and 2 more authors. In Proceedings of the Second International Workshop Towards Digital Language Equality (TDLE): Focusing on Sustainability @ LREC-COLING 2024, May 2024.
% Workshop paper in the TDLE @ LREC-COLING 2024 proceedings, pages 43--52.
% Only a url is recorded for this entry (no doi field).
@inproceedings{diandaru-etal-2024-better,
  author    = {Diandaru, Ryandito and Susanto, Lucky and Tang, Zilu and Purwarianti, Ayu and Wijaya, Derry Tanti},
  title     = {Could We Have Had Better Multilingual {LLM}s if {E}nglish Was Not the Central Language?},
  editor    = {Gaspari, Federico and Moorkens, Joss and Aldabe, Itziar and Farwell, Aritz and Altuna, Begona and Piperidis, Stelios and Rehm, Georg and Rigau, German},
  booktitle = {Proceedings of the Second International Workshop Towards Digital Language Equality (TDLE): Focusing on Sustainability @ LREC-COLING 2024},
  year      = {2024},
  month     = may,
  pages     = {43--52},
  address   = {Torino, Italia},
  publisher = {ELRA and ICCL},
  url       = {https://aclanthology.org/2024.tdle-1.4},
}
2023
- Replicable Benchmarking of Neural Machine Translation (NMT) on Low-Resource Local Languages in Indonesia. Lucky Susanto, Ryandito Diandaru, Adila Krisnadhi, and 2 more authors. In Proceedings of the First Workshop in South East Asian Language Processing, Nov 2023.
% Paper in the proceedings of the First Workshop in South East Asian Language
% Processing, pages 100--115. Both a doi and a url are recorded.
@inproceedings{susanto-etal-2023-replicable,
  author    = {Susanto, Lucky and Diandaru, Ryandito and Krisnadhi, Adila and Purwarianti, Ayu and Wijaya, Derry Tanti},
  title     = {Replicable Benchmarking of Neural Machine Translation ({NMT}) on Low-Resource Local Languages in {I}ndonesia},
  editor    = {Wijaya, Derry and Aji, Alham Fikri and Vania, Clara and Winata, Genta Indra and Purwarianti, Ayu},
  booktitle = {Proceedings of the First Workshop in South East Asian Language Processing},
  year      = {2023},
  month     = nov,
  pages     = {100--115},
  address   = {Nusa Dua, Bali, Indonesia},
  publisher = {Association for Computational Linguistics},
  doi       = {10.18653/v1/2023.sealp-1.8},
  url       = {https://aclanthology.org/2023.sealp-1.8},
}
- NusaCrowd: Open Source Initiative for Indonesian NLP Resources. Samuel Cahyawijaya, Holy Lovenia, Alham Fikri Aji, and 45 more authors. In Findings of the Association for Computational Linguistics: ACL 2023, Jul 2023.
% Paper in Findings of the Association for Computational Linguistics: ACL 2023,
% pages 13745--13818. Both a doi and a url are recorded.
@inproceedings{cahyawijaya-etal-2023-nusacrowd,
  author    = {Cahyawijaya, Samuel and Lovenia, Holy and Aji, Alham Fikri and Winata, Genta and Wilie, Bryan and Koto, Fajri and Mahendra, Rahmad and Wibisono, Christian and Romadhony, Ade and Vincentio, Karissa and Santoso, Jennifer and Moeljadi, David and Wirawan, Cahya and Hudi, Frederikus and Wicaksono, Muhammad Satrio and Parmonangan, Ivan and Alfina, Ika and Putra, Ilham Firdausi and Rahmadani, Samsul and Oenang, Yulianti and Septiandri, Ali and Jaya, James and Dhole, Kaustubh and Suryani, Arie and Putri, Rifki Afina and Su, Dan and Stevens, Keith and Nityasya, Made Nindyatama and Adilazuarda, Muhammad and Hadiwijaya, Ryan and Diandaru, Ryandito and Yu, Tiezheng and Ghifari, Vito and Dai, Wenliang and Xu, Yan and Damapuspita, Dyah and Wibowo, Haryo and Tho, Cuk and Karo Karo, Ichwanul and Fatyanosa, Tirana and Ji, Ziwei and Neubig, Graham and Baldwin, Timothy and Ruder, Sebastian and Fung, Pascale and Sujaini, Herry and Sakti, Sakriani and Purwarianti, Ayu},
  title     = {{N}usa{C}rowd: Open Source Initiative for {I}ndonesian {NLP} Resources},
  editor    = {Rogers, Anna and Boyd-Graber, Jordan and Okazaki, Naoaki},
  booktitle = {Findings of the Association for Computational Linguistics: ACL 2023},
  year      = {2023},
  month     = jul,
  pages     = {13745--13818},
  address   = {Toronto, Canada},
  publisher = {Association for Computational Linguistics},
  doi       = {10.18653/v1/2023.findings-acl.868},
  url       = {https://aclanthology.org/2023.findings-acl.868},
}