% Conference paper by Pradhan, Zhang and Bethard in the IRI 2016 proceedings.
% The citation key is an opaque hex identifier; it is kept unchanged so that
% existing citations of this entry keep resolving.
% The conference name/dates and the publisher copyright line, previously packed
% into a printed note, are stored in eventtitle / eventdate / copyright.
% Classic BibTeX styles ignore those fields; biblatex uses eventtitle and
% eventdate (ISO 8601 range).
@inproceedings{696d29cbc2584c54960413614a8f2c85,
  author     = {Pradhan, Ligaj and Zhang, Chengcui and Bethard, Steven},
  title      = {Towards extracting coherent user concerns and their hierarchical organization from user reviews},
  booktitle  = {Proceedings - 2016 {IEEE} 17th International Conference on Information Reuse and Integration, {IRI} 2016},
  eventtitle = {17th {IEEE} International Conference on Information Reuse and Integration, {IRI} 2016},
  eventdate  = {2016-07-28/2016-07-30},
  pages      = {582--590},
  publisher  = {Institute of Electrical and Electronics Engineers Inc.},
  year       = {2016},
  doi        = {10.1109/IRI.2016.85},
  language   = {English (US)},
  keywords   = {Coherent user concerns, Hierarchical clustering, Recommendation systems, Topic modeling, User reviews},
  abstract   = {Mining user reviews to discover what the user likes and dislikes is vital to understanding user behaviors. Topic modeling techniques have been extensively used to discover meaningful topics for user reviews and to discover user behaviors. Extracted topics may be a mixture of different concepts and hence very likely to be less coherent and unclear, especially when extracting a relatively small number of topics. As such, we propose a method that extracts a relatively large number of topics using a topic modeling technique and relies on hierarchical clustering to exploit semantic distances between topics, to generate a small number of highly coherent and clear topics. We also compare this set of topics representing hidden user concerns extracted by our approach with those derived using LDA (Latent Dirichlet Allocation) and a hierarchical variant called Pachinko Allocation Model (PAM) and show that our method generates more coherent user concerns. Further, we also demonstrate how a hierarchical model of user concerns can be automatically generated by exploiting our approach. Such a hierarchy may help capture the conceptual distances between various user concerns and inherent similarities between users having those concerns.},
  copyright  = {{\textcopyright} 2016 IEEE},
}