{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,15]],"date-time":"2026-04-15T10:08:36Z","timestamp":1776247716986,"version":"3.50.1"},"reference-count":38,"publisher":"Elsevier BV","issue":"3","license":[{"start":{"date-parts":[[2013,5,1]],"date-time":"2013-05-01T00:00:00Z","timestamp":1367366400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Information Processing &amp; Management"],"published-print":{"date-parts":[[2013,5]]},"DOI":"10.1016\/j.ipm.2012.12.004","type":"journal-article","created":{"date-parts":[[2013,1,20]],"date-time":"2013-01-20T09:31:48Z","timestamp":1358674308000},"page":"596-606","source":"Crossref","is-referenced-by-count":11,"title":["Clustering tagged documents with labeled and unlabeled documents"],"prefix":"10.1016","volume":"49","author":[{"given":"Chien-Liang","family":"Liu","sequence":"first","affiliation":[]},{"given":"Wen-Hoar","family":"Hsaio","sequence":"additional","affiliation":[]},{"given":"Chia-Hoang","family":"Lee","sequence":"additional","affiliation":[]},{"given":"Chun-Hsien","family":"Chen","sequence":"additional","affiliation":[]}],"member":"78","reference":[{"key":"10.1016\/j.ipm.2012.12.004_b0005","series-title":"Proceedings of the 25th annual international ACM SIGIR conference on research and development in information retrieval. SIGIR \u201902.","first-page":"105","article-title":"The use of unlabeled data to improve supervised learning for text summarization","author":"Amini","year":"2002"},{"key":"10.1016\/j.ipm.2012.12.004_b0010","series-title":"Proceedings of the nineteenth international conference on machine learning. ICML \u201902.","first-page":"27","article-title":"Semi-supervised clustering by seeding","author":"Basu","year":"2002"},{"key":"10.1016\/j.ipm.2012.12.004_b0015","series-title":"Proceedings of the tenth ACM SIGKDD international conference on knowledge discovery and data mining. KDD \u201904.","first-page":"59","article-title":"A probabilistic framework for semi-supervised clustering","author":"Basu","year":"2004"},{"key":"10.1016\/j.ipm.2012.12.004_b0020","unstructured":"Begelman, G., Keller, P., & Smadja, F. (2006). Automated tag clustering: Improving search and exploration in the tag space. In Collaborative web tagging workshop at WWW2006."},{"key":"10.1016\/j.ipm.2012.12.004_b0025","unstructured":"Berendt, B., Hanser, C. (2007). Tags are not metadata, but just more content to some people. In ICWSM 07."},{"issue":"March","key":"10.1016\/j.ipm.2012.12.004_b0030","first-page":"993","article-title":"Latent Dirichlet allocation","volume":"3","author":"Blei","year":"2003","journal-title":"Journal of Machine Learning Research"},{"key":"10.1016\/j.ipm.2012.12.004_b0035","unstructured":"Brooks, C. H., & Montanez, N. (2005). An analysis of the effectiveness of tagging in blogs. In AAAI spring symposium on computational approaches to analyzing Weblogs. AAAI."},{"key":"10.1016\/j.ipm.2012.12.004_b0040","series-title":"WSDM \u201909: Proceedings of the second ACM international conference on web search and data mining","first-page":"84","article-title":"Improving music genre classification using collaborative tagging data","author":"Chen","year":"2009"},{"issue":"September","key":"10.1016\/j.ipm.2012.12.004_b0045","first-page":"61","article-title":"An unsupervised automated essay scoring system","volume":"25","author":"Chen","year":"2010","journal-title":"IEEE Intelligent Systems"},{"key":"10.1016\/j.ipm.2012.12.004_b0050","doi-asserted-by":"crossref","first-page":"391","DOI":"10.1002\/(SICI)1097-4571(199009)41:6<391::AID-ASI1>3.0.CO;2-9","article-title":"Indexing by latent semantic analysis","volume":"41","author":"Deerwester","year":"1990","journal-title":"Journal of the American Society of Information Science"},{"issue":"1","key":"10.1016\/j.ipm.2012.12.004_b0055","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1111\/j.2517-6161.1977.tb01600.x","article-title":"Maximum likelihood from incomplete data via the EM algorithm","volume":"39","author":"Dempster","year":"1977","journal-title":"Journal of the Royal Statistical Society, Series B"},{"issue":"April","key":"10.1016\/j.ipm.2012.12.004_b0060","doi-asserted-by":"crossref","first-page":"3913","DOI":"10.1016\/j.csda.2008.01.011","article-title":"On the equivalence between non-negative matrix factorization and probabilistic latent semantic indexing","volume":"52","author":"Ding","year":"2008","journal-title":"Computational Statistics and Data Analysis"},{"key":"10.1016\/j.ipm.2012.12.004_b0065","series-title":"Proceedings of the 28th annual international ACM SIGIR conference on research and development in information retrieval. SIGIR \u201905.","first-page":"601","article-title":"Relation between PLSA and NMF and implications","author":"Gaussier","year":"2005"},{"key":"10.1016\/j.ipm.2012.12.004_b0070","series-title":"Proceedings of the 26th annual international ACM SIGIR conference on research and development in information retrieval. SIGIR \u201903.","first-page":"433","article-title":"On an equivalence between PLSI and LDA","author":"Girolami","year":"2003"},{"issue":"Suppl. 1","key":"10.1016\/j.ipm.2012.12.004_b0075","doi-asserted-by":"crossref","first-page":"5228","DOI":"10.1073\/pnas.0307752101","article-title":"Finding scientific topics","volume":"101","author":"Griffiths","year":"2004","journal-title":"Proceedings of the National Academy of Sciences"},{"key":"10.1016\/j.ipm.2012.12.004_b0080","series-title":"IJCAI\u201907: Proceedings of the 20th international joint conference on artificial intelligence","first-page":"2772","article-title":"An analysis of the use of tags in a blog recommender system","author":"Hayes","year":"2007"},{"key":"10.1016\/j.ipm.2012.12.004_b0085","unstructured":"Hofmann, T. (1999). Probabilistic latent semantic analysis. In Proc. of uncertainty in artificial intelligence, UAI\u201999."},{"issue":"1\u20132","key":"10.1016\/j.ipm.2012.12.004_b0090","doi-asserted-by":"crossref","first-page":"177","DOI":"10.1023\/A:1007617005950","article-title":"Unsupervised learning by probabilistic latent semantic analysis","volume":"42","author":"Hofmann","year":"2001","journal-title":"Machine Learning"},{"key":"10.1016\/j.ipm.2012.12.004_b0095","series-title":"Proceedings of the 1998 conference on Advances in neural information processing systems II.","first-page":"466","article-title":"Learning from dyadic data","author":"Hofmann","year":"1999"},{"key":"10.1016\/j.ipm.2012.12.004_b0100","series-title":"Proceedings of the 29th annual international ACM SIGIR conference on research and development in information retrieval. SIGIR \u201906.","first-page":"405","article-title":"Document clustering with prior knowledge","author":"Ji","year":"2006"},{"issue":"6755","key":"10.1016\/j.ipm.2012.12.004_b0105","doi-asserted-by":"crossref","first-page":"788","DOI":"10.1038\/44565","article-title":"Learning the parts of objects by non-negative matrix factorization","volume":"401","author":"Lee","year":"1999","journal-title":"Nature"},{"key":"10.1016\/j.ipm.2012.12.004_b0110","unstructured":"Lee, D. D., & Seung, H. S. (2000). Algorithms for non-negative matrix factorization. In: NIPS (pp. 556\u2013562)."},{"key":"10.1016\/j.ipm.2012.12.004_b0115","unstructured":"Liu, C.-L., Hsaio, W.-H., Lee, C.-H., & Chen, C.-H. (2011). Document clustering with labeled and unlabeled data using constrained-PLSA. Tech. rep. Department of Computer Science, National Chiao Tung University. <http:\/\/islab.cis.nctu.edu.tw\/report\/constrained-PLSA.pdf>."},{"issue":"3","key":"10.1016\/j.ipm.2012.12.004_b0120","doi-asserted-by":"crossref","first-page":"397","DOI":"10.1109\/TSMCC.2011.2136334","article-title":"Movie rating and review summarization in mobile environment","volume":"42","author":"Liu","year":"2012","journal-title":"IEEE Transactions on Systems, Man, and Cybernetics, Part C"},{"key":"10.1016\/j.ipm.2012.12.004_b0125","series-title":"Introduction to information retrieval","author":"Manning","year":"2008"},{"key":"10.1016\/j.ipm.2012.12.004_b0130","first-page":"849","article-title":"On spectral clustering: analysis and an algorithm","volume":"Vol. 14","author":"Ng","year":"2001"},{"issue":"May","key":"10.1016\/j.ipm.2012.12.004_b0135","doi-asserted-by":"crossref","first-page":"103","DOI":"10.1023\/A:1007692713085","article-title":"Text classification from labeled and unlabeled documents using EM","volume":"39","author":"Nigam","year":"2000","journal-title":"Machine Learning"},{"key":"10.1016\/j.ipm.2012.12.004_b0140","series-title":"Proceedings of the 26th annual international conference on machine learning. ICML \u201909.","first-page":"841","article-title":"An efficient sparse metric learning in high-dimensional space via l1-penalized log-determinant regularization","author":"Qi","year":"2009"},{"key":"10.1016\/j.ipm.2012.12.004_b0145","series-title":"WSDM \u201909: Proceedings of the second ACM international conference on web search and data mining","first-page":"54","article-title":"Clustering the tagged web","author":"Ramage","year":"2009"},{"issue":"8","key":"10.1016\/j.ipm.2012.12.004_b0150","doi-asserted-by":"crossref","first-page":"888","DOI":"10.1109\/34.868688","article-title":"Normalized cuts and image segmentation","volume":"22","author":"Shi","year":"2000","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"10.1016\/j.ipm.2012.12.004_b0155","doi-asserted-by":"crossref","unstructured":"Shi, X., Tseng, B. L., & Adamic, L. A. (2009). Information diffusion in computer science citation networks. In ICWSM.","DOI":"10.1609\/icwsm.v3i1.13974"},{"key":"10.1016\/j.ipm.2012.12.004_b0160","series-title":"Proceedings of the eighteenth international conference on machine learning. ICML \u201901.","first-page":"577","article-title":"Constrained K-means clustering with background knowledge","author":"Wagstaff","year":"2001"},{"key":"10.1016\/j.ipm.2012.12.004_b0165","series-title":"Proceedings of the 17th ACM conference on Information and knowledge management. CIKM \u201908.","first-page":"1457","article-title":"Semi-supervised metric learning by maximizing constraint margin","author":"Wang","year":"2008"},{"key":"10.1016\/j.ipm.2012.12.004_b0170","doi-asserted-by":"crossref","unstructured":"Wang, F., Li, T., & Zhang, C. (2008). Semi-supervised clustering via matrix factorization. In SDM (pp. 1\u201312).","DOI":"10.1137\/1.9781611972788.1"},{"key":"10.1016\/j.ipm.2012.12.004_b0175","series-title":"Proceedings of the 30th annual international ACM SIGIR conference on research and development in information retrieval. SIGIR \u201907.","first-page":"95","article-title":"Regularized clustering for documents","author":"Wang","year":"2007"},{"key":"10.1016\/j.ipm.2012.12.004_b0180","series-title":"Proceedings of the 27th international conference on machine learning (ICML-10).","first-page":"1135","article-title":"A new analysis of co-training","author":"Wang","year":"2010"},{"key":"10.1016\/j.ipm.2012.12.004_b0185","series-title":"Proceedings of the 16th ACM SIGKDD international conference on Knowledge discovery and data mining. KDD \u201910.","first-page":"563","article-title":"Flexible constrained spectral clustering","author":"Wang","year":"2010"},{"key":"10.1016\/j.ipm.2012.12.004_b0190","series-title":"Proceedings of the 17th international conference on World Wide Web. WWW \u201908.","first-page":"715","article-title":"Exploring social annotations for information retrieval","author":"Zhou","year":"2008"}],"container-title":["Information Processing &amp; Management"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0306457312001422?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0306457312001422?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2024,5,4]],"date-time":"2024-05-04T22:18:08Z","timestamp":1714861088000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S0306457312001422"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2013,5]]},"references-count":38,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2013,5]]}},"alternative-id":["S0306457312001422"],"URL":"https:\/\/doi.org\/10.1016\/j.ipm.2012.12.004","relation":{},"ISSN":["0306-4573"],"issn-type":[{"value":"0306-4573","type":"print"}],"subject":[],"published":{"date-parts":[[2013,5]]}}}