% Conference paper in the FSKD 2015 proceedings. The note field records the
% conference dates (15-17 Aug 2015), while year/month/day give 2016-01-13 --
% presumably the online publication date; confirm against the publisher record.
% NOTE(review): address holds a country, not the publisher's city -- confirm and refine.
@inproceedings{d551f95fabd5432fae50f574575f8df6,
  author    = {Shan, Lili and Sun, Chengjie and Lin, Lei and Liu, Ming and Wang, Xiaolong and Liu, Bingquan},
  title     = {Evaluating tag quality for blogger modelling via topic models},
  booktitle = {2015 12th International Conference on Fuzzy Systems and Knowledge Discovery, {FSKD} 2015},
  editor    = {Tang, Zhuo and Du, Jiayi and Yin, Shu and Li, Renfa and He, Ligang},
  pages     = {1770--1776},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  address   = {United States},
  year      = {2016},
  month     = jan,
  day       = {13},
  doi       = {10.1109/FSKD.2015.7382215},
  language  = {English},
  keywords  = {blog representation, semantic similarity, tag quality evaluation, topic model},
  abstract  = {with the permission of annotating blog posts with tags, tags has become one of the most important resources used to describe blogger features. However, due to the irregular quality of tags, not all tags are appropriate for representing blogger's preferences. Poor tags or spam tags confuse the actual user's preferences and spam terms, thus they should be detected before they are directly used to tag bloggers. A detailed quantitative analysis on the categories of tag spam in the blogosphere is presented in this paper. Taking advantage of abundant text contents in blog posts and the relatively stable semantic relationship between tags and their target posts, an unsupervised approach based on topic models is proposed to evaluate tag quality for blogger modelling in the blogosphere. The latent interest topics of a blogger are mined out through Latent Dirichlet Allocation (LDA) topic modeling. The blog post of the blogger is represented as a distribution over latent topics and a latent topic is a distribution over words of the vocabulary. A tag is also expressed as a specific co-occurrence term vector. Ultimately, a scheme is devised to determine the similarity between each tag and its target blog post. Then the tags with less similarity value can be identified as poor tag. The experimental results indicate that the proposed method achieves more promising performance than the baselines on datasets collected from Sina Blog, which is one of the biggest Chinese blogs.},
  note      = {Publisher Copyright: {\textcopyright} 2015 IEEE.; 12th International Conference on Fuzzy Systems and Knowledge Discovery, FSKD 2015 ; Conference date: 15-08-2015 Through 17-08-2015},
}