@inproceedings{49867361273848edae8e520c8a8947fa,
title = "Line-break prediction of hanmun text using recurrent neural networks",
abstract = "Recurrent neural network (RNN) has been broadly applied to natural language processing (NLP) and machine translation problems, by creating a deep learning model for sequential data. Hanmun is a Korean term for Chinese characters, and there are many cases in which Korean is pronounced by borrowing only the Chinese characters. Also, there are proper nouns and place names in the traditional Korean which are not used now. Therefore, we need a model for analyzing Hanmun rather than analyzing Chinese words in Chinese. In this paper, we propose a model for line-break prediction of Hanmun text using various types of RNNs. It is suitable for analyzing Hanmun meaning and usage vary according to the previous words. This model was used to segment the beginning and ending words of Hanmun characters and middle words. Experimental results show that our approach gets high performance in line-break prediction on Hanmun.",
keywords = "Bi-directional LSTM, Hanmun, line break, long short term memory (LSTM), recurrent neural network (RNN)",
author = "Oh, {Dong Hoon} and Zahra Shah and Jang, {Gil Jin}",
note = "Publisher Copyright: {\textcopyright} 2017 IEEE.; 8th International Conference on Information and Communication Technology Convergence, ICTC 2017 ; Conference date: 18-10-2017 Through 20-10-2017",
year = "2017",
month = dec,
day = "12",
doi = "10.1109/ICTC.2017.8190763",
language = "English",
series = "International Conference on Information and Communication Technology Convergence: ICT Convergence Technologies Leading the Fourth Industrial Revolution, ICTC 2017",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "720--724",
booktitle = "International Conference on Information and Communication Technology Convergence",
address = "United States",
}