{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,8]],"date-time":"2026-04-08T15:54:40Z","timestamp":1775663680945,"version":"3.50.1"},"reference-count":42,"publisher":"Elsevier BV","issue":"1","license":[{"start":{"date-parts":[[2005,1,1]],"date-time":"2005-01-01T00:00:00Z","timestamp":1104537600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Computational Statistics &amp; Data Analysis"],"published-print":{"date-parts":[[2005,1]]},"DOI":"10.1016\/j.csda.2003.11.027","type":"journal-article","created":{"date-parts":[[2004,2,10]],"date-time":"2004-02-10T10:17:53Z","timestamp":1076408273000},"page":"69-85","source":"Crossref","is-referenced-by-count":141,"title":["PCA and PLS with very large data sets"],"prefix":"10.1016","volume":"48","author":[{"given":"Nouna","family":"Kettaneh","sequence":"first","affiliation":[]},{"given":"Anders","family":"Berglund","sequence":"additional","affiliation":[]},{"given":"Svante","family":"Wold","sequence":"additional","affiliation":[]}],"member":"78","reference":[{"key":"10.1016\/j.csda.2003.11.027_BIB1","doi-asserted-by":"crossref","unstructured":"Andersson, C., Bro, R. (Eds.), 2000. Multiway analysis (special issue). J. Chemometr. 14, 103\u2013334.","DOI":"10.1002\/1099-128X(200005\/06)14:3<103::AID-CEM624>3.0.CO;2-L"},{"key":"10.1016\/j.csda.2003.11.027_BIB2","doi-asserted-by":"crossref","first-page":"415","DOI":"10.1002\/(SICI)1099-128X(199905\/08)13:3\/4<415::AID-CEM544>3.0.CO;2-8","article-title":"Multiscale analysis and modelling using wavelets","volume":"13","author":"Bakshi","year":"1999","journal-title":"J. Chemometr"},{"key":"10.1016\/j.csda.2003.11.027_BIB3","doi-asserted-by":"crossref","first-page":"141","DOI":"10.1002\/(SICI)1099-128X(199703)11:2<141::AID-CEM461>3.0.CO;2-2","article-title":"INLR; implicit non-linear latent variable regression","volume":"11","author":"Berglund","year":"1996","journal-title":"J. Chemometr"},{"key":"10.1016\/j.csda.2003.11.027_BIB4","doi-asserted-by":"crossref","first-page":"321","DOI":"10.1002\/cem.679","article-title":"The GIFI approach to non-linear PLS modeling","volume":"15","author":"Berglund","year":"2001","journal-title":"J. Chemometr"},{"key":"10.1016\/j.csda.2003.11.027_BIB5","unstructured":"Box, G.E.P., 1973. Department of Statistics, Madison, WI, USA (This message was given frequently in Box's scientific talks and seminars, including the famous Monday night seminars addressing various problems of statistics applied to science and engineering)."},{"key":"10.1016\/j.csda.2003.11.027_BIB6","doi-asserted-by":"crossref","first-page":"73","DOI":"10.1002\/(SICI)1099-128X(199701)11:1<73::AID-CEM435>3.0.CO;2-#","article-title":"Improved PLS algorithms","volume":"11","author":"Dayal","year":"1997","journal-title":"J. Chemometr"},{"key":"10.1016\/j.csda.2003.11.027_BIB7","doi-asserted-by":"crossref","unstructured":"Eld\u00e9n, L., 2003. Partial least-squares vs. Lanczos bidiagonalization\u2014I: analysis of a projection method for multiple regression. Comput. Statist. Data Anal., in press.","DOI":"10.1016\/S0167-9473(03)00138-5"},{"key":"10.1016\/j.csda.2003.11.027_BIB8","doi-asserted-by":"crossref","first-page":"139","DOI":"10.1016\/0169-7439(92)80099-P","article-title":"The H-principle in modelling with application in chemometrics","volume":"14","author":"H\u00f6skuldsson","year":"1992","journal-title":"Chemometr. Intell. Lab. Systems"},{"key":"10.1016\/j.csda.2003.11.027_BIB9","unstructured":"H\u00f6skuldsson, A., 1996. Prediction Methods in Science and Technology, Vol. 1. Thor Publishing, Copenhagen, ISBN 87-985941-0-9."},{"key":"10.1016\/j.csda.2003.11.027_BIB10","series-title":"A User's Guide to Principal Components","author":"Jackson","year":"1991"},{"key":"10.1016\/j.csda.2003.11.027_BIB11","unstructured":"Kl\u00f6sgen, W., Zytkow, J. (Eds.), 2001. Handbook of Data Mining and Knowledge Discovery. Oxford University Press, Oxford."},{"key":"10.1016\/j.csda.2003.11.027_BIB12","doi-asserted-by":"crossref","unstructured":"Kowalski, B.R. (Ed.), 1984. Chemometrics: Mathematics and Statistics in Chemistry, Reidel, Dordrecht, Holland.","DOI":"10.1007\/978-94-017-1026-8"},{"key":"10.1016\/j.csda.2003.11.027_BIB13","doi-asserted-by":"crossref","first-page":"5632","DOI":"10.1021\/ja00771a016","article-title":"Pattern recognition. A powerful approach to interpreting chemical data","volume":"94","author":"Kowalski","year":"1972","journal-title":"J. Amer. Chem. Soc"},{"key":"10.1016\/j.csda.2003.11.027_BIB14","doi-asserted-by":"crossref","first-page":"45","DOI":"10.1002\/cem.1180070104","article-title":"The Kernel algorithm for PLS","volume":"7","author":"Lindgren","year":"1993","journal-title":"J. Chemometr"},{"key":"10.1016\/j.csda.2003.11.027_BIB15","doi-asserted-by":"crossref","first-page":"1320","DOI":"10.1021\/jm991118x","article-title":"Statistical molecular design of building blocks for combinatorial chemistry","volume":"43","author":"Linusson","year":"2000","journal-title":"J. Med. Chem"},{"key":"10.1016\/j.csda.2003.11.027_BIB16","series-title":"Computer-Assisted Lead Finding and Optimization. Current Tools for Medicinal Chemistry","first-page":"190","article-title":"Intelligent combinatorial libraries","author":"Lundstedt","year":"1997"},{"key":"10.1016\/j.csda.2003.11.027_BIB17","unstructured":"MacGregor, J., 2002. Latent variable methods in chemometrics: theoretical foundations and practical implications (SSC7 special issue). J. Chemometr."},{"key":"10.1016\/j.csda.2003.11.027_BIB18","doi-asserted-by":"crossref","first-page":"336","DOI":"10.1198\/004017001316975925","article-title":"Clustering massive data sets with applications in software metrics and tomography (with discussion)","volume":"43","author":"Maitra","year":"2001","journal-title":"Technometrics"},{"key":"10.1016\/j.csda.2003.11.027_BIB19","series-title":"Multivariate Calibration","author":"Martens","year":"1989"},{"key":"10.1016\/j.csda.2003.11.027_BIB20","doi-asserted-by":"crossref","first-page":"81","DOI":"10.1037\/h0043158","article-title":"The magical number seven, plus minus two","volume":"63","author":"Miller","year":"1956","journal-title":"Psychol. Rev"},{"issue":"3\u20134","key":"10.1016\/j.csda.2003.11.027_BIB21","doi-asserted-by":"crossref","first-page":"435","DOI":"10.1002\/(SICI)1099-128X(199905\/08)13:3\/4<435::AID-CEM549>3.0.CO;2-S","article-title":"The flexibility of fuzzy clustering illustrated by examples","volume":"13","author":"N\u00e6s","year":"1999","journal-title":"J. Chemometr"},{"key":"10.1016\/j.csda.2003.11.027_BIB22","doi-asserted-by":"crossref","first-page":"45","DOI":"10.1016\/S0169-7439(96)00007-X","article-title":"Missing data methods in PCA and PLS; score calculations with incomplete observations","volume":"35","author":"Nelson","year":"1996","journal-title":"Chemometr. Intell. Lab. Systems"},{"key":"10.1016\/j.csda.2003.11.027_BIB23","doi-asserted-by":"crossref","unstructured":"Nguyen, D.V., Rocke, D.M., 2003. On partial least-squares dimension reduction for microarray-based classification: a simulation study. Comput. Statist. Data Anal., in press.","DOI":"10.1016\/j.csda.2003.08.001"},{"issue":"6","key":"10.1016\/j.csda.2003.11.027_BIB24","doi-asserted-by":"crossref","first-page":"418","DOI":"10.1038\/35076576","article-title":"Computational analysis of microarray data","volume":"2","author":"Quackenbush","year":"2001","journal-title":"Nat. Rev. Genet"},{"key":"10.1016\/j.csda.2003.11.027_BIB25","doi-asserted-by":"crossref","first-page":"111","DOI":"10.1002\/cem.1180080204","article-title":"A PLS Kernel algorithm for data sets with many variables and less objects. Part I. Theory and algorithms","volume":"8","author":"R\u00e4nnar","year":"1994","journal-title":"J. Chemometr"},{"key":"10.1016\/j.csda.2003.11.027_BIB26","doi-asserted-by":"crossref","first-page":"459","DOI":"10.1002\/cem.1180090604","article-title":"A PLS Kernel algorithm for data sets with many variables and less objects. Part 2. Cross-validation, missing data, and examples","volume":"9","author":"R\u00e4nnar","year":"1995","journal-title":"J. Chemometr"},{"key":"10.1016\/j.csda.2003.11.027_BIB27","doi-asserted-by":"crossref","first-page":"185","DOI":"10.1002\/cem.1180010306","article-title":"Partial least squares analysis with cross-validation for the two-class problem","volume":"1","author":"Stahle","year":"1987","journal-title":"J. Chemometr"},{"key":"10.1016\/j.csda.2003.11.027_BIB28","unstructured":"Subramaniam, S., 2000. Bioinformatics. Talk at the Euchem BCDC symposium, Sigtuna, Sweden, September 2000."},{"key":"10.1016\/j.csda.2003.11.027_BIB29","unstructured":"Tenenhaus, M., 1998. La Regression PLS: Theorie et Pratique. Technip, Paris."},{"key":"10.1016\/j.csda.2003.11.027_BIB30","unstructured":"Torre, F., et al. 2002. Data mining issues on multivariate online industrial control (SSC7 special issue). J. Chemometr."},{"key":"10.1016\/j.csda.2003.11.027_BIB31","doi-asserted-by":"crossref","first-page":"209","DOI":"10.1016\/S0169-7439(98)00013-6","article-title":"PLS regression on wavelet compressed NIR spectra","volume":"42","author":"Trygg","year":"1998","journal-title":"Chemometr. Intell. Lab. Systems"},{"key":"10.1016\/j.csda.2003.11.027_BIB32","doi-asserted-by":"crossref","first-page":"299","DOI":"10.1002\/cem.681","article-title":"2-D wavelet analysis and compression of on-line industrial process data","volume":"15","author":"Trygg","year":"2001","journal-title":"J. Chemometr"},{"key":"10.1016\/j.csda.2003.11.027_BIB33","series-title":"Statistical Modeling by Wavelets","author":"Vidakovic","year":"1999"},{"key":"10.1016\/j.csda.2003.11.027_BIB34","unstructured":"Wentzell, P., 2002. Case studies in the applications of maximum likelihood principal components analysis (SSC7 special issue). J. Chemometr."},{"issue":"5","key":"10.1016\/j.csda.2003.11.027_BIB35","doi-asserted-by":"crossref","first-page":"301","DOI":"10.1002\/(SICI)1099-128X(199809\/10)12:5<301::AID-CEM515>3.0.CO;2-S","article-title":"Analysis of multiblock and hierarchical PCA and PLS models","volume":"12","author":"Westerhuis","year":"1998","journal-title":"J. Chemometr"},{"key":"10.1016\/j.csda.2003.11.027_BIB36","doi-asserted-by":"crossref","first-page":"127","DOI":"10.1016\/0031-3203(76)90014-5","article-title":"Pattern recognition by means of disjoint principal components models","volume":"8","author":"Wold","year":"1976","journal-title":"Pattern Recognition"},{"key":"10.1016\/j.csda.2003.11.027_BIB37","unstructured":"Wold, H., 1982. Soft modeling. The basic design and some extensions. In: Joreskog, K.-G., Wold, H. (Eds.), Systems Under Indirect Observation, Vols. I and II. North-Holland, Amsterdam (Chapter 1 of Vol. II)."},{"key":"10.1016\/j.csda.2003.11.027_BIB38","doi-asserted-by":"crossref","first-page":"589","DOI":"10.1016\/0731-7085(91)80183-A","article-title":"Chemometrics, why, what and where to next?","volume":"9","author":"Wold","year":"1991","journal-title":"J. Pharmaceut. Biomed. Anal"},{"key":"10.1016\/j.csda.2003.11.027_BIB39","series-title":"Wiley Encyclopedia of Analytical Chemistry","first-page":"9710","article-title":"Multivariate calibration of analytical data","author":"Wold","year":"2000"},{"key":"10.1016\/j.csda.2003.11.027_BIB40","doi-asserted-by":"crossref","first-page":"37","DOI":"10.1016\/0169-7439(87)80084-9","article-title":"Principal components analysis","volume":"2","author":"Wold","year":"1987","journal-title":"Chemometr. Intell. Lab. System"},{"key":"10.1016\/j.csda.2003.11.027_BIB41","doi-asserted-by":"crossref","first-page":"463","DOI":"10.1002\/(SICI)1099-128X(199609)10:5\/6<463::AID-CEM445>3.0.CO;2-L","article-title":"Hierarchical multi-block PLS and PC models, for easier interpretation, and as an alternative to variable selection","volume":"10","author":"Wold","year":"1996","journal-title":"J. Chemometr"},{"key":"10.1016\/j.csda.2003.11.027_BIB42","doi-asserted-by":"crossref","first-page":"109","DOI":"10.1016\/S0169-7439(01)00155-1","article-title":"PLS-Regression: a basic tool of chemometrics","volume":"58","author":"Wold","year":"2001","journal-title":"Chemometr. Intell. Lab. Systems"}],"container-title":["Computational Statistics &amp; Data Analysis"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0167947303002949?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0167947303002949?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2020,3,30]],"date-time":"2020-03-30T17:09:03Z","timestamp":1585588143000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S0167947303002949"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2005,1]]},"references-count":42,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2005,1]]}},"alternative-id":["S0167947303002949"],"URL":"https:\/\/doi.org\/10.1016\/j.csda.2003.11.027","relation":{},"ISSN":["0167-9473"],"issn-type":[{"value":"0167-9473","type":"print"}],"subject":[],"published":{"date-parts":[[2005,1]]}}}