@comment{
  Conference paper in the PKAW 2020 proceedings (Springer, Lecture Notes in
  Computer Science series).
  NOTE(review): the address field holds a country rather than the publisher's
  city, and no volume number is given for the series -- confirm both against
  the publisher's record before relying on them.
  The conference date in the note field was exported as 07-01-2021 / 08-01-2021;
  it is read as day-month-year because the proceedings appeared in Feb 2021.
}
@inproceedings{b55741b5ecf64e2eaaffbf1728664b33,
  author    = {Imperial, Joseph Marvin and Ong, Ethel},
  title     = {Semi-automatic Construction of Sight Words Dictionary for {Filipino} Text Readability},
  booktitle = {Knowledge Management and Acquisition for Intelligent Systems -- 17th Pacific Rim Knowledge Acquisition Workshop, {PKAW} 2020, Proceedings},
  editor    = {Uehara, Hiroshi and Yamaguchi, Takayasu and Bai, Quan},
  series    = {Lecture Notes in Computer Science},
  publisher = {Springer Science and Business Media Deutschland GmbH},
  address   = {Germany},
  pages     = {168--177},
  year      = {2021},
  month     = feb,
  day       = {20},
  doi       = {10.1007/978-3-030-69886-7_14},
  isbn      = {9783030698850},
  language  = {English},
  keywords  = {Filipino text, High-frequency words, Text readability},
  abstract  = {Readability formulas consider word familiarity as one of the factors for predicting the readability of children{\textquoteright}s books. Word familiarity is dependent on the frequency in which the words are encountered in daily reading. Often referred to as ``sight words'', developing effective recognition of these high-frequency words can assist young readers to develop their reading fluency and comprehension. In this paper, we describe our work in building a dictionary of sight words for Filipino with the use of a corpus of Filipino literary materials written for children. We expanded the dictionary to a total of 664 words with the use of pre-trained word embedding model. The availability of such dictionary can facilitate the development of a readability formula for Filipino text, especially in the context of its lexical complexity.},
  note      = {17th Pacific Rim Knowledge Acquisition Workshop, PKAW 2020 held in conjunction with the International Joint Conference on Artificial Intelligence -- Pacific Rim International Conference on Artificial Intelligence, IJCAI-PRICAI 2020; Conference date: 7--8 January 2021},
}