% Conference paper by Huang and Ye on the wHunter focused web crawler
% (ICADL 2004 according to the note field). Text outside an entry is
% ignored by BibTeX, so these lines act as comments.
%
% Conventions applied in this entry:
%   - names are stored in "Last, First" form;
%   - the system name in the title is brace-protected so that styles which
%     sentence-case titles keep its capitalisation;
%   - the DOI is stored bare (no LaTeX escaping of the underscore);
%   - address holds the publisher location taken from the copyright line
%     in the note field; language is given in ASCII.
%
% NOTE(review): the note field gives a 2004 copyright and a December 2004
% conference date while year is 2005 -- confirm the publication year
% against the publisher record before relying on it.
@inproceedings{334b5ce19ea242ef82e9c8749ae0301c,
  author    = {Huang, Yun and Ye, Yunming},
  title     = {{wHunter}: A Focused Web Crawler -- A Tool for Digital Library},
  booktitle = {Digital Libraries},
  editor    = {Miao, Qihao and Lim, Ee-peng and Chen, Zhaoneng and Fu, Yuxi and Chen, Hsinchun and Fox, Edward},
  series    = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},
  publisher = {Springer Verlag},
  address   = {Berlin, Heidelberg},
  year      = {2005},
  pages     = {519--522},
  isbn      = {9783540240303},
  doi       = {10.1007/978-3-540-30544-6_30},
  language  = {English},
  note      = {Publisher Copyright: {\textcopyright} Springer-Verlag Berlin Heidelberg 2004.; 7th International Conference on Asian Digital Libraries, ICADL 2004 ; Conference date: 13-12-2004 Through 17-12-2004},
  abstract  = {Topic-driven Web Crawler or focused crawler is the key tool of online web information library. It{\textquoteright}s a challenging issue that how to achieve good performance efficiently with limited time and space resources. This paper proposes a focused web crawler wHunter that implements incremental and multi-strategy learning by taking the advantages of both SVM (support vector machines) and na{\"i}ve Bayes. On the one hand, the initial performance is guaranteed via SVM classifier; on the other hand, when enough web pages are obtained, the classifier is switched to na{\"i}ve Bayes so that on-line incremental learning is achieved. Experimental results show that our proposed algorithm is efficient and easy to implement.},
}