% Journal article entry. The citation key is kept unchanged so existing
% \cite{ART003329445} references still resolve.
@article{ART003329445,
  author  = {Kim, Dong-Hyuk and Cho, Kyu-Cheol},
  title   = {Byte-Level Processing Limits in {KSL} Translation: A Study of the {KoBART}--{ByT5} Performance Gap},
  journal = {Journal of The Korea Society of Computer and Information},
  issn    = {1598-849X},
  year    = {2026},
  volume  = {31},
  number  = {4},
  pages   = {33--44},
}
TY - JOUR
AU - Dong-Hyuk Kim
AU - Kyu-Cheol Cho
TI - Byte-Level Processing Limits in KSL Translation: A Study of the KoBART–ByT5 Performance Gap
JO - Journal of The Korea Society of Computer and Information
PY - 2026
VL - 31
IS - 4
PB - The Korean Society Of Computer And Information
SP - 33
EP - 44
SN - 1598-849X
AB - This study investigates how input representation granularity affects performance and training behavior in Korean-to-Korean Sign Language (KSL) gloss translation. Using the National Institute of Korean Language Korean-KSL parallel corpus (2022-2024), we compare a token/subword-based pretrained Seq2Seq model (KoBART) with a byte-level model (ByT5). Quantitative results show a decisive advantage for KoBART, which achieves 0.447 METEOR versus 0.1192 for ByT5 (≈275% relative improvement). Analyses indicate that ByT5 is constrained by substantially longer effective sequences, which degrades sentence-level generation, whereas KoBART benefits from subword segmentation that effectively performs structural alignment with KSL glosses, demonstrating superior suitability in terms of faithful information reconstruction. These findings provide empirical evidence for the critical role of input granularity design in low-resource KSL gloss translation and establish a robust baseline for future KSL machine translation studies.
KW - KSL Gloss Translation;Input Granularity;KoBART;ByT5;Seq2Seq Model;Transformer
DO -
UR -
ER -
Dong-Hyuk Kim and Kyu-Cheol Cho. (2026). Byte-Level Processing Limits in KSL Translation: A Study of the KoBART–ByT5 Performance Gap. Journal of The Korea Society of Computer and Information, 31(4), 33-44.
Dong-Hyuk Kim and Kyu-Cheol Cho. 2026, "Byte-Level Processing Limits in KSL Translation: A Study of the KoBART–ByT5 Performance Gap", Journal of The Korea Society of Computer and Information, vol.31, no.4, pp.33-44.
Dong-Hyuk Kim, Kyu-Cheol Cho "Byte-Level Processing Limits in KSL Translation: A Study of the KoBART–ByT5 Performance Gap" Journal of The Korea Society of Computer and Information 31.4 (2026): 33-44.
Dong-Hyuk Kim, Kyu-Cheol Cho. Byte-Level Processing Limits in KSL Translation: A Study of the KoBART–ByT5 Performance Gap. Journal of The Korea Society of Computer and Information. 2026; 31(4), 33-44.
Dong-Hyuk Kim and Kyu-Cheol Cho. "Byte-Level Processing Limits in KSL Translation: A Study of the KoBART–ByT5 Performance Gap" Journal of The Korea Society of Computer and Information 31, no.4 (2026) : 33-44.
Dong-Hyuk Kim; Kyu-Cheol Cho. Byte-Level Processing Limits in KSL Translation: A Study of the KoBART–ByT5 Performance Gap. Journal of The Korea Society of Computer and Information, 2026, 31(4), 33-44.
Dong-Hyuk Kim; Kyu-Cheol Cho. Byte-Level Processing Limits in KSL Translation: A Study of the KoBART–ByT5 Performance Gap. Journal of The Korea Society of Computer and Information. 2026; 31(4) 33-44.
Dong-Hyuk Kim, Kyu-Cheol Cho. Byte-Level Processing Limits in KSL Translation: A Study of the KoBART–ByT5 Performance Gap. Journal of The Korea Society of Computer and Information. 2026; 31(4), 33-44.
Dong-Hyuk Kim and Kyu-Cheol Cho. "Byte-Level Processing Limits in KSL Translation: A Study of the KoBART–ByT5 Performance Gap" Journal of The Korea Society of Computer and Information 31, no.4 (2026) : 33-44.