% Conference paper in the ICHCI 2022 proceedings (SPIE), year 2023.
% Percent signs in the abstract are escaped so they cannot act as TeX comment
% characters when the field is written to a .bbl file or typeset by a style.
% Proper nouns and acronyms are brace-protected against sentence-casing styles.
@inproceedings{7865585f661e4ea9b3260fef66b3058d,
  author    = {Wang, Bifeng and Xu, Xiaotong and Chen, Haocih and Xie, Xinyi and Chen, Jiawei and Liu, Qian and Fu, Yong},
  title     = {Data mining for news content: a case of {Cantonese} opera news topic modelling analysis},
  booktitle = {Third International Conference on Intelligent Computing and Human-Computer Interaction, {ICHCI} 2022},
  editor    = {Subramanian, Kannimuthu},
  series    = {Proceedings of SPIE - The International Society for Optical Engineering},
  publisher = {SPIE},
  year      = {2023},
  doi       = {10.1117/12.2656041},
  language  = {English},
  keywords  = {Cantonese opera, Data mining, LDA, machine learning, NLP, topic modelling},
  abstract  = {Topic modelling approach is widely used for text data mining in NLP (Natural Language Processing). Text mining has been used for analysis of ICH (intangible cultural heritage), where Cantonese opera is a representative ICH of Lingnan culture. This study retrieved news content on Cantonese Opera and used machine learning analysis (LDA topic modelling) method to find out the distribution of the topics. Four main themes are concluded: the development, cooperation, and inheritance of Cantonese opera (taken up to 45.1\% in all data); The traditional form (23.5\%); Innovative forms (18.3\%); Education and cultural inheritance of Cantonese opera (13.2\%). This research further explored how to better promote Cantonese opera by analysing the topics as well as the data, and suggested that emphasis should be placed on the innovation of traditional elements in Cantonese opera, keeping them close to life, and education.},
  note      = {Publisher Copyright: {\textcopyright} 2023 SPIE.; 3rd International Conference on Intelligent Computing and Human-Computer Interaction, ICHCI 2022 ; Conference date: 12-08-2022 Through 14-08-2022},
}