diff --git a/DESCRIPTION b/DESCRIPTION
index cd6d9e6..19399d9 100644
--- a/DESCRIPTION
+++ b/DESCRIPTION
@@ -1,7 +1,7 @@
 Package: mdatools
 Title: Multivariate Data Analysis for Chemometrics
-Version: 0.8.0
-Date: 2016-10-07
+Version: 0.8.1
+Date: 2016-10-30
 Author: Sergey Kucheryavskiy
 Maintainer: Sergey Kucheryavskiy <svkucheryavski@gmail.com>
 Description: Package implements projection based methods for preprocessing,
diff --git a/NEWS b/NEWS
index 300271f..4175b92 100755
--- a/NEWS
+++ b/NEWS
@@ -1,3 +1,9 @@
+v.0.8.1
+=======
+* fixed a bug in PCA when explained variance was calculated incorrectly for data with excluded rows
+* fixed several issues with SIMCA (cross-validation) and SIMCAM (Cooman's plot)
+* added a chapter about SIMCA to the tutorial
+
 v.0.8.0
 =======
 * tutorial has been moved from GitBook to Bookdown and fully rewritten
diff --git a/NEWS.md b/NEWS.md
index 300271f..4175b92 100755
--- a/NEWS.md
+++ b/NEWS.md
@@ -1,3 +1,9 @@
+v.0.8.1
+=======
+* fixed a bug in PCA when explained variance was calculated incorrectly for data with excluded rows
+* fixed several issues with SIMCA (cross-validation) and SIMCAM (Cooman's plot)
+* added a chapter about SIMCA to the tutorial
+
 v.0.8.0
 =======
 * tutorial has been moved from GitBook to Bookdown and fully rewritten
diff --git a/R/ldecomp.R b/R/ldecomp.R
index 2f9a4d4..1792098 100755
--- a/R/ldecomp.R
+++ b/R/ldecomp.R
@@ -238,11 +238,13 @@ ldecomp.getVariances = function(Q, totvar) {
    cumresvar = colSums(Q) / totvar * 100
    cumexpvar = 100 - cumresvar
    expvar = c(cumexpvar[1], diff(cumexpvar))
-   
+  
    res = list(
       expvar = expvar,
       cumexpvar = cumexpvar
    )
+   
+   res
 }
 
 #' Statistical limits for Q and T2 residuals
diff --git a/R/pca.R b/R/pca.R
index a58340e..4cab0ab 100755
--- a/R/pca.R
+++ b/R/pca.R
@@ -685,13 +685,17 @@ predict.pca = function(object, x, cal = FALSE, ...) {
    x = prep.autoscale(x, center = object$center, scale = object$scale)
    scores = x %*% object$loadings
    residuals = x - tcrossprod(scores, object$loadings)
-      
+     
    # compute total variance
    if (length(object$exclcols) > 0){
       x = x[, -object$exclcols, drop = F]
       attrs$exclcols = object$exclcols      
    }
    
+   if (length(attrs$exclrows) > 0){
+      x = x[-object$exclrows, ,drop = F]
+   }
+   
    totvar = sum(x^2)
    
    # create and return the results object
diff --git a/R/simca.R b/R/simca.R
index bdb58f1..c503c34 100755
--- a/R/simca.R
+++ b/R/simca.R
@@ -324,20 +324,14 @@ simca.crossval = function(model, x, cv, center = T, scale = F) {
             Q[ind, ] = Q[ind, ] + res$Q
             T2[ind, ] = T2[ind, ] + res$T2
             
-            # compute limits
-            lim = ldecomp.getResLimits(m$eigenvals, nrow(x.cal), ncomp, model$alpha)
-            Qlim = Qlim + lim$Qlim
-            T2lim = T2lim + lim$T2lim
          }
       }  
    }
    
    Q = Q / nrep;
    T2 = T2 / nrep;
-   Qlim = Qlim / nrep;
-   T2lim = T2lim / nrep;
    
-   m = list(Qlim = Qlim, T2lim = T2lim, classname = model$classname, ncomp = model$ncomp)
+   m = list(Qlim = model$Qlim, T2lim = model$T2lim, classname = model$classname, ncomp = model$ncomp)
    r = list(Q = Q, T2 = T2, classname = model$classname)
    c.pred = simca.classify(m, r)
    
diff --git a/R/simcam.R b/R/simcam.R
index 8691be7..fa5873c 100755
--- a/R/simcam.R
+++ b/R/simcam.R
@@ -166,7 +166,6 @@ predict.simcam = function(object, x, c.ref = NULL, cv = F, ...) {
       pred.res[[i]] = predict(object$models[[i]], x, c.ref)
       c.pred[, , i] = pred.res[[i]]$c.pred[, object$models[[i]]$ncomp.selected, ]
    }
-   
    dimnames(c.pred) = list(rownames(x), paste('Comp'), object$classnames)
    c.pred = mda.setattr(c.pred, attrs, 'row')
    attr(c.pred, 'name') = 'SIMCAM predictions'
diff --git a/R/simcamres.R b/R/simcamres.R
index 8baf644..fdbf7eb 100755
--- a/R/simcamres.R
+++ b/R/simcamres.R
@@ -179,7 +179,7 @@ plotCooman.simcamres = function(obj, nc = c(1, 2), type = 'p', main = "Cooman's
    attrs = mda.getattr(obj$c.pred)
    res1 = obj$pred.res[[nc[1]]]
    res2 = obj$pred.res[[nc[2]]]
-   data = cbind(sqrt(res1$Q[, res1$ncomp.selected]), sqrt(res2$Q[, res2$ncomp.selected]))
+   data = cbind(res1$Q[, res1$ncomp.selected], res2$Q[, res2$ncomp.selected])
    rownames(data) = rownames(obj$c.pred)
    data = mda.setattr(data, attrs, 'row') 
    if (show.limits == T)
diff --git a/docs/_main_files/figure-html/unnamed-chunk-43-1.png b/docs/_main_files/figure-html/unnamed-chunk-43-1.png
index 52ed672..2d0d327 100644
Binary files a/docs/_main_files/figure-html/unnamed-chunk-43-1.png and b/docs/_main_files/figure-html/unnamed-chunk-43-1.png differ
diff --git a/docs/_main_files/figure-html/unnamed-chunk-5-1.png b/docs/_main_files/figure-html/unnamed-chunk-5-1.png
new file mode 100644
index 0000000..d539b78
Binary files /dev/null and b/docs/_main_files/figure-html/unnamed-chunk-5-1.png differ
diff --git a/docs/_main_files/figure-html/unnamed-chunk-61-1.png b/docs/_main_files/figure-html/unnamed-chunk-61-1.png
index d85c05a..b83f13e 100644
Binary files a/docs/_main_files/figure-html/unnamed-chunk-61-1.png and b/docs/_main_files/figure-html/unnamed-chunk-61-1.png differ
diff --git a/docs/_main_files/figure-html/unnamed-chunk-7-1.png b/docs/_main_files/figure-html/unnamed-chunk-7-1.png
new file mode 100644
index 0000000..d91a2d3
Binary files /dev/null and b/docs/_main_files/figure-html/unnamed-chunk-7-1.png differ
diff --git a/docs/_main_files/figure-html/unnamed-chunk-8-1.png b/docs/_main_files/figure-html/unnamed-chunk-8-1.png
new file mode 100644
index 0000000..6d22954
Binary files /dev/null and b/docs/_main_files/figure-html/unnamed-chunk-8-1.png differ
diff --git a/docs/_main_files/figure-html/unnamed-chunk-88-1.png b/docs/_main_files/figure-html/unnamed-chunk-88-1.png
new file mode 100644
index 0000000..caa592f
Binary files /dev/null and b/docs/_main_files/figure-html/unnamed-chunk-88-1.png differ
diff --git a/docs/_main_files/figure-html/unnamed-chunk-89-1.png b/docs/_main_files/figure-html/unnamed-chunk-89-1.png
new file mode 100644
index 0000000..d539b78
Binary files /dev/null and b/docs/_main_files/figure-html/unnamed-chunk-89-1.png differ
diff --git a/docs/_main_files/figure-html/unnamed-chunk-91-1.png b/docs/_main_files/figure-html/unnamed-chunk-91-1.png
new file mode 100644
index 0000000..d91a2d3
Binary files /dev/null and b/docs/_main_files/figure-html/unnamed-chunk-91-1.png differ
diff --git a/docs/_main_files/figure-html/unnamed-chunk-92-1.png b/docs/_main_files/figure-html/unnamed-chunk-92-1.png
new file mode 100644
index 0000000..6d22954
Binary files /dev/null and b/docs/_main_files/figure-html/unnamed-chunk-92-1.png differ
diff --git a/docs/_main_files/figure-html/unnamed-chunk-95-1.png b/docs/_main_files/figure-html/unnamed-chunk-95-1.png
new file mode 100644
index 0000000..55d3eed
Binary files /dev/null and b/docs/_main_files/figure-html/unnamed-chunk-95-1.png differ
diff --git a/docs/_main_files/figure-html/unnamed-chunk-97-1.png b/docs/_main_files/figure-html/unnamed-chunk-97-1.png
new file mode 100644
index 0000000..1e6c325
Binary files /dev/null and b/docs/_main_files/figure-html/unnamed-chunk-97-1.png differ
diff --git a/docs/_main_files/figure-html/unnamed-chunk-98-1.png b/docs/_main_files/figure-html/unnamed-chunk-98-1.png
new file mode 100644
index 0000000..184b26c
Binary files /dev/null and b/docs/_main_files/figure-html/unnamed-chunk-98-1.png differ
diff --git a/docs/_main_files/figure-html/unnamed-chunk-99-1.png b/docs/_main_files/figure-html/unnamed-chunk-99-1.png
new file mode 100644
index 0000000..c16cc72
Binary files /dev/null and b/docs/_main_files/figure-html/unnamed-chunk-99-1.png differ
diff --git a/docs/attributes-and-factors.html b/docs/attributes-and-factors.html
index 7c581a9..fb89c9f 100644
--- a/docs/attributes-and-factors.html
+++ b/docs/attributes-and-factors.html
@@ -25,7 +25,7 @@
 
 <meta name="author" content="Sergey Kucheryavskiy">
 
-<meta name="date" content="2016-10-16">
+<meta name="date" content="2016-10-30">
 
 <script type="text/x-mathjax-config">
 MathJax.Hub.Config({
@@ -107,7 +107,7 @@
 <ul class="summary">
 <li class="chapter" data-level="" data-path="index.html"><a href="index.html"><i class="fa fa-check"></i>Introduction</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html"><i class="fa fa-check"></i>What is new</a><ul>
-<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-to-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
+<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#last-changes-and-improvements-to-book-and-package"><i class="fa fa-check"></i>Last changes and improvements to book and package</a></li>
 </ul></li>
 <li class="chapter" data-level="" data-path="overview.html"><a href="overview.html"><i class="fa fa-check"></i>Overview</a><ul>
@@ -159,6 +159,12 @@
 </ul></li>
 <li class="chapter" data-level="" data-path="variable-selection.html"><a href="variable-selection.html"><i class="fa fa-check"></i>Variable selection</a></li>
 </ul></li>
+<li class="chapter" data-level="" data-path="simca-classification.html"><a href="simca-classification.html"><i class="fa fa-check"></i>SIMCA classification</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html"><i class="fa fa-check"></i>Calibration and validation</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html#predictions-and-validation-with-a-test-set"><i class="fa fa-check"></i>Predictions and validation with a test set</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="multiclass-classification.html"><a href="multiclass-classification.html"><i class="fa fa-check"></i>Multiclass classification</a></li>
+</ul></li>
 </ul>
 
       </nav>
diff --git a/docs/calibration-and-validation.html b/docs/calibration-and-validation.html
new file mode 100644
index 0000000..92c8b5f
--- /dev/null
+++ b/docs/calibration-and-validation.html
@@ -0,0 +1,349 @@
+<!DOCTYPE html>
+<html >
+
+<head>
+
+  <meta charset="UTF-8">
+  <meta http-equiv="X-UA-Compatible" content="IE=edge">
+  <title>Getting started with mdatools for R</title>
+  <meta content="text/html; charset=UTF-8" http-equiv="Content-Type">
+  <meta name="description" content="This is a user guide for mdatools — R package for preprocessing, exploring and analysis of multivariate data. The package provides methods mostly common for Chemometrics. The general idea of the package is to collect most of the common chemometric methods and give a similar user interface for using them. So if a user knows how to make a model and visualise results for one method, he or she can easily do this for the others.">
+  <meta name="generator" content="bookdown 0.1 and GitBook 2.6.7">
+
+  <meta property="og:title" content="Getting started with mdatools for R" />
+  <meta property="og:type" content="book" />
+  
+  
+  <meta property="og:description" content="This is a user guide for mdatools — R package for preprocessing, exploring and analysis of multivariate data. The package provides methods mostly common for Chemometrics. The general idea of the package is to collect most of the common chemometric methods and give a similar user interface for using them. So if a user knows how to make a model and visualise results for one method, he or she can easily do this for the others." />
+  <meta name="github-repo" content="svkucheryavski/mdatools.bookdown" />
+
+  <meta name="twitter:card" content="summary" />
+  <meta name="twitter:title" content="Getting started with mdatools for R" />
+  
+  <meta name="twitter:description" content="This is a user guide for mdatools — R package for preprocessing, exploring and analysis of multivariate data. The package provides methods mostly common for Chemometrics. The general idea of the package is to collect most of the common chemometric methods and give a similar user interface for using them. So if a user knows how to make a model and visualise results for one method, he or she can easily do this for the others." />
+  
+
+<meta name="author" content="Sergey Kucheryavskiy">
+
+<meta name="date" content="2016-10-30">
+
+<script type="text/x-mathjax-config">
+MathJax.Hub.Config({
+  TeX: { equationNumbers: { autoNumber: "AMS" } }
+});
+</script>
+
+  <meta name="viewport" content="width=device-width, initial-scale=1">
+  <meta name="apple-mobile-web-app-capable" content="yes">
+  <meta name="apple-mobile-web-app-status-bar-style" content="black">
+  
+  
+<link rel="prev" href="simca-classification.html">
+<link rel="next" href="multiclass-classification.html">
+
+<script src="libs/jquery-2.2.3/jquery.min.js"></script>
+<link href="libs/gitbook-2.6.7/css/style.css" rel="stylesheet" />
+<link href="libs/gitbook-2.6.7/css/plugin-bookdown.css" rel="stylesheet" />
+<link href="libs/gitbook-2.6.7/css/plugin-highlight.css" rel="stylesheet" />
+<link href="libs/gitbook-2.6.7/css/plugin-search.css" rel="stylesheet" />
+<link href="libs/gitbook-2.6.7/css/plugin-fontsettings.css" rel="stylesheet" />
+
+
+
+
+
+
+
+
+
+<style type="text/css">
+div.sourceCode { overflow-x: auto; }
+table.sourceCode, tr.sourceCode, td.lineNumbers, td.sourceCode {
+  margin: 0; padding: 0; vertical-align: baseline; border: none; }
+table.sourceCode { width: 100%; line-height: 100%; }
+td.lineNumbers { text-align: right; padding-right: 4px; padding-left: 4px; color: #aaaaaa; border-right: 1px solid #aaaaaa; }
+td.sourceCode { padding-left: 5px; }
+code > span.kw { color: #007020; font-weight: bold; } /* Keyword */
+code > span.dt { color: #902000; } /* DataType */
+code > span.dv { color: #40a070; } /* DecVal */
+code > span.bn { color: #40a070; } /* BaseN */
+code > span.fl { color: #40a070; } /* Float */
+code > span.ch { color: #4070a0; } /* Char */
+code > span.st { color: #4070a0; } /* String */
+code > span.co { color: #60a0b0; font-style: italic; } /* Comment */
+code > span.ot { color: #007020; } /* Other */
+code > span.al { color: #ff0000; font-weight: bold; } /* Alert */
+code > span.fu { color: #06287e; } /* Function */
+code > span.er { color: #ff0000; font-weight: bold; } /* Error */
+code > span.wa { color: #60a0b0; font-weight: bold; font-style: italic; } /* Warning */
+code > span.cn { color: #880000; } /* Constant */
+code > span.sc { color: #4070a0; } /* SpecialChar */
+code > span.vs { color: #4070a0; } /* VerbatimString */
+code > span.ss { color: #bb6688; } /* SpecialString */
+code > span.im { } /* Import */
+code > span.va { color: #19177c; } /* Variable */
+code > span.cf { color: #007020; font-weight: bold; } /* ControlFlow */
+code > span.op { color: #666666; } /* Operator */
+code > span.bu { } /* BuiltIn */
+code > span.ex { } /* Extension */
+code > span.pp { color: #bc7a00; } /* Preprocessor */
+code > span.at { color: #7d9029; } /* Attribute */
+code > span.do { color: #ba2121; font-style: italic; } /* Documentation */
+code > span.an { color: #60a0b0; font-weight: bold; font-style: italic; } /* Annotation */
+code > span.cv { color: #60a0b0; font-weight: bold; font-style: italic; } /* CommentVar */
+code > span.in { color: #60a0b0; font-weight: bold; font-style: italic; } /* Information */
+</style>
+
+</head>
+
+<body>
+
+
+  <div class="book without-animation with-summary font-size-2 font-family-1" data-basepath=".">
+
+    <div class="book-summary">
+      <nav role="navigation">
+
+<ul class="summary">
+<li class="chapter" data-level="" data-path="index.html"><a href="index.html"><i class="fa fa-check"></i>Introduction</a></li>
+<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html"><i class="fa fa-check"></i>What is new</a><ul>
+<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
+<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#last-changes-and-improvements-to-book-and-package"><i class="fa fa-check"></i>Last changes and improvements to book and package</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="overview.html"><a href="overview.html"><i class="fa fa-check"></i>Overview</a><ul>
+<li class="chapter" data-level="" data-path="what-mdatools-can-do.html"><a href="what-mdatools-can-do.html"><i class="fa fa-check"></i>What mdatools can do?</a></li>
+<li class="chapter" data-level="" data-path="how-to-install.html"><a href="how-to-install.html"><i class="fa fa-check"></i>How to install</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="datasets-and-plots.html"><a href="datasets-and-plots.html"><i class="fa fa-check"></i>Datasets and plots</a><ul>
+<li class="chapter" data-level="" data-path="attributes-and-factors.html"><a href="attributes-and-factors.html"><i class="fa fa-check"></i>Attributes and factors</a><ul>
+<li class="chapter" data-level="" data-path="attributes-and-factors.html"><a href="attributes-and-factors.html#package-specific-attributes"><i class="fa fa-check"></i>Package specific attributes</a></li>
+<li class="chapter" data-level="" data-path="attributes-and-factors.html"><a href="attributes-and-factors.html#attributes-for-plots"><i class="fa fa-check"></i>Attributes for plots</a></li>
+<li class="chapter" data-level="" data-path="attributes-and-factors.html"><a href="attributes-and-factors.html#special-methods-for-data-transformations"><i class="fa fa-check"></i>Special methods for data transformations</a></li>
+<li class="chapter" data-level="" data-path="attributes-and-factors.html"><a href="attributes-and-factors.html#data-frames-with-factors"><i class="fa fa-check"></i>Data frames with factors</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="simple-plots.html"><a href="simple-plots.html"><i class="fa fa-check"></i>Simple plots</a><ul>
+<li class="chapter" data-level="" data-path="simple-plots.html"><a href="simple-plots.html#scatter-plots"><i class="fa fa-check"></i>Scatter plots</a></li>
+<li class="chapter" data-level="" data-path="simple-plots.html"><a href="simple-plots.html#line-plots"><i class="fa fa-check"></i>Line plots</a></li>
+<li class="chapter" data-level="" data-path="simple-plots.html"><a href="simple-plots.html#bar-and-errorbar-plots"><i class="fa fa-check"></i>Bar and errorbar plots</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="plots-for-groups-of-objects.html"><a href="plots-for-groups-of-objects.html"><i class="fa fa-check"></i>Plots for groups of objects</a><ul>
+<li class="chapter" data-level="" data-path="plots-for-groups-of-objects.html"><a href="plots-for-groups-of-objects.html#one-matrix-or-data-frame"><i class="fa fa-check"></i>One matrix or data frame</a></li>
+<li class="chapter" data-level="" data-path="plots-for-groups-of-objects.html"><a href="plots-for-groups-of-objects.html#list-with-matrices-or-data-frames"><i class="fa fa-check"></i>List with matrices or data frames</a></li>
+<li class="chapter" data-level="" data-path="plots-for-groups-of-objects.html"><a href="plots-for-groups-of-objects.html#use-factors-to-split-a-dataset-into-groups"><i class="fa fa-check"></i>Use factors to split a dataset into groups</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="working-with-images.html"><a href="working-with-images.html"><i class="fa fa-check"></i>Working with images</a></li>
+<li class="chapter" data-level="" data-path="preprocessing.html"><a href="preprocessing.html"><i class="fa fa-check"></i>Preprocessing</a><ul>
+<li class="chapter" data-level="" data-path="preprocessing.html"><a href="preprocessing.html#autoscaling"><i class="fa fa-check"></i>Autoscaling</a></li>
+<li class="chapter" data-level="" data-path="preprocessing.html"><a href="preprocessing.html#correction-of-spectral-baseline"><i class="fa fa-check"></i>Correction of spectral baseline</a></li>
+<li class="chapter" data-level="" data-path="preprocessing.html"><a href="preprocessing.html#smoothing-and-derivatives"><i class="fa fa-check"></i>Smoothing and derivatives</a></li>
+</ul></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="principal-component-analysis.html"><a href="principal-component-analysis.html"><i class="fa fa-check"></i>Principal component analysis</a><ul>
+<li class="chapter" data-level="" data-path="models-and-results.html"><a href="models-and-results.html"><i class="fa fa-check"></i>Models and results</a><ul>
+<li class="chapter" data-level="" data-path="models-and-results.html"><a href="models-and-results.html#model-calibration"><i class="fa fa-check"></i>Model calibration</a></li>
+<li class="chapter" data-level="" data-path="models-and-results.html"><a href="models-and-results.html#model-validation"><i class="fa fa-check"></i>Model validation</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="plotting-methods.html"><a href="plotting-methods.html"><i class="fa fa-check"></i>Plotting methods</a><ul>
+<li class="chapter" data-level="" data-path="plotting-methods.html"><a href="plotting-methods.html#support-for-images"><i class="fa fa-check"></i>Support for images</a></li>
+<li class="chapter" data-level="" data-path="plotting-methods.html"><a href="plotting-methods.html#manual-x-values-for-loading-line-plot"><i class="fa fa-check"></i>Manual x-values for loading line plot</a></li>
+<li class="chapter" data-level="" data-path="plotting-methods.html"><a href="plotting-methods.html#excluding-rows-and-columns"><i class="fa fa-check"></i>Excluding rows and columns</a></li>
+</ul></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="partial-least-squares-regression.html"><a href="partial-least-squares-regression.html"><i class="fa fa-check"></i>Partial least squares regression</a><ul>
+<li class="chapter" data-level="" data-path="models-and-results-1.html"><a href="models-and-results-1.html"><i class="fa fa-check"></i>Models and results</a><ul>
+<li class="chapter" data-level="" data-path="models-and-results-1.html"><a href="models-and-results-1.html#model-calibration-1"><i class="fa fa-check"></i>Model calibration</a></li>
+<li class="chapter" data-level="" data-path="models-and-results-1.html"><a href="models-and-results-1.html#model-validation-1"><i class="fa fa-check"></i>Model validation</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="plotting-methods-1.html"><a href="plotting-methods-1.html"><i class="fa fa-check"></i>Plotting methods</a><ul>
+<li class="chapter" data-level="" data-path="plotting-methods-1.html"><a href="plotting-methods-1.html#excluding-rows-and-columns-1"><i class="fa fa-check"></i>Excluding rows and columns</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="variable-selection.html"><a href="variable-selection.html"><i class="fa fa-check"></i>Variable selection</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="simca-classification.html"><a href="simca-classification.html"><i class="fa fa-check"></i>SIMCA classification</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html"><i class="fa fa-check"></i>Calibration and validation</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html#predictions-and-validation-with-a-test-set"><i class="fa fa-check"></i>Predictions and validation with a test set</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="multiclass-classification.html"><a href="multiclass-classification.html"><i class="fa fa-check"></i>Multiclass classification</a></li>
+</ul></li>
+</ul>
+
+      </nav>
+    </div>
+
+    <div class="book-body">
+      <div class="body-inner">
+        <div class="book-header" role="navigation">
+          <h1>
+            <i class="fa fa-circle-o-notch fa-spin"></i><a href="./">Getting started with mdatools for R</a>
+          </h1>
+        </div>
+
+        <div class="page-wrapper" tabindex="-1" role="main">
+          <div class="page-inner">
+
+            <section class="normal" id="section-">
+<div id="calibration-and-validation" class="section level2 unnumbered">
+<h2>Calibration and validation</h2>
+<p>The model calibration is similar to PCA, but there are several additional arguments which are important for classification. The first one is a class name. The class name is a string, which can be used later, e.g. for identifying class members for testing. The second important argument is a level of significance, <code>alpha</code>. This parameter is used for calculation of statistical limits and can be considered as the probability of false negatives. The default value is 0.05.</p>
+<p>In this chapter, as well as when describing other classification methods, we will use the famous Iris dataset, available in R. The dataset includes 150 measurements of three Iris species: <em>Setosa</em>, <em>Virginica</em> and <em>Versicolor</em>. The measurements are the length and width of petals and sepals in cm. Use <code>?iris</code> for more details.</p>
+<p>Let’s get the data and split it into calibration and test sets.</p>
+<div class="sourceCode"><pre class="sourceCode r"><code class="sourceCode r"><span class="kw">data</span>(iris)
+<span class="kw">head</span>(iris)</code></pre></div>
+<pre><code>##   Sepal.Length Sepal.Width Petal.Length Petal.Width Species
+## 1          5.1         3.5          1.4         0.2  setosa
+## 2          4.9         3.0          1.4         0.2  setosa
+## 3          4.7         3.2          1.3         0.2  setosa
+## 4          4.6         3.1          1.5         0.2  setosa
+## 5          5.0         3.6          1.4         0.2  setosa
+## 6          5.4         3.9          1.7         0.4  setosa</code></pre>
+<div class="sourceCode"><pre class="sourceCode r"><code class="sourceCode r"><span class="co"># generate indices for calibration set</span>
+idx =<span class="st"> </span><span class="kw">seq</span>(<span class="dv">1</span>, <span class="kw">nrow</span>(iris), <span class="dt">by =</span> <span class="dv">2</span>)
+
+<span class="co"># split the values</span>
+X.c =<span class="st"> </span>iris[idx, <span class="dv">1</span>:<span class="dv">4</span>]
+c.c =<span class="st"> </span>iris[idx, <span class="dv">5</span>, drop =<span class="st"> </span>F]
+
+X.t =<span class="st"> </span>iris[-idx, <span class="dv">1</span>:<span class="dv">4</span>]
+c.t =<span class="st"> </span>iris[-idx, <span class="dv">5</span>, drop =<span class="st"> </span>F]</code></pre></div>
+<p>Now, because for calibration we need only objects belonging to a class, we will split the <code>X.c</code> into three matrices — one for each species. The data is ordered by species, so this can be done relatively easily by taking consecutive blocks of 25 rows.</p>
+<div class="sourceCode"><pre class="sourceCode r"><code class="sourceCode r">X.set =<span class="st"> </span>X.c[<span class="dv">1</span>:<span class="dv">25</span>, ]
+X.ver =<span class="st"> </span>X.c[<span class="dv">26</span>:<span class="dv">50</span>, ]
+X.vir =<span class="st"> </span>X.c[<span class="dv">51</span>:<span class="dv">75</span>, ]</code></pre></div>
+<p>Let’s start with creating a model for class <em>Versicolor</em> and exploring available statistics and plots. We will use full cross-validation to validate the results.</p>
+<div class="sourceCode"><pre class="sourceCode r"><code class="sourceCode r"><span class="kw">library</span>(mdatools)
+m =<span class="st"> </span><span class="kw">simca</span>(X.ver, <span class="st">&#39;versicolor&#39;</span>, <span class="dt">ncomp =</span> <span class="dv">3</span>, <span class="dt">cv =</span> <span class="dv">1</span>)
+<span class="kw">summary</span>(m)</code></pre></div>
+<pre><code>## 
+## SIMCA model for class &quot;versicolor&quot; summary
+## 
+## Info: 
+## Significance level (alpha): 0.05
+## Selected number of components: 3
+## 
+##        Expvar Cumexpvar Sens (cal) Expvar (cv) Sens (cv)
+## Comp 1  76.44     76.44       0.96       71.85      0.88
+## Comp 2  13.93     90.37       0.92       13.91      0.84
+## Comp 3   8.45     98.82       0.92       12.24      0.84</code></pre>
+<p>Let’s look at the plots, starting with the summary plot.</p>
+<div class="sourceCode"><pre class="sourceCode r"><code class="sourceCode r"><span class="kw">plot</span>(m)</code></pre></div>
+<p><img src="_main_files/figure-html/unnamed-chunk-88-1.png" width="864" /></p>
+<p>The plot is very similar to what we have seen for the PCA model; the only difference is that it shows <em>modelling power</em> instead of loadings. Modelling power is a measure of the contribution of each variable to the model and varies from 0 to 1. Usually variables with modelling power below 0.1 are considered irrelevant.</p>
+<p>Let’s take a closer look at the residuals plot with different values for alpha (we will keep the number of components equal to three in all cases).</p>
+<div class="sourceCode"><pre class="sourceCode r"><code class="sourceCode r">m1 =<span class="st"> </span><span class="kw">simca</span>(X.ver, <span class="st">&#39;versicolor&#39;</span>, <span class="dt">ncomp =</span> <span class="dv">3</span>, <span class="dt">cv =</span> <span class="dv">1</span>, <span class="dt">alpha =</span> <span class="fl">0.01</span>)
+m2 =<span class="st"> </span><span class="kw">simca</span>(X.ver, <span class="st">&#39;versicolor&#39;</span>, <span class="dt">ncomp =</span> <span class="dv">3</span>, <span class="dt">cv =</span> <span class="dv">1</span>, <span class="dt">alpha =</span> <span class="fl">0.05</span>)
+m3 =<span class="st"> </span><span class="kw">simca</span>(X.ver, <span class="st">&#39;versicolor&#39;</span>, <span class="dt">ncomp =</span> <span class="dv">3</span>, <span class="dt">cv =</span> <span class="dv">1</span>, <span class="dt">alpha =</span> <span class="fl">0.10</span>)
+m4 =<span class="st"> </span><span class="kw">simca</span>(X.ver, <span class="st">&#39;versicolor&#39;</span>, <span class="dt">ncomp =</span> <span class="dv">3</span>, <span class="dt">cv =</span> <span class="dv">1</span>, <span class="dt">alpha =</span> <span class="fl">0.15</span>)
+
+<span class="kw">par</span>(<span class="dt">mfrow =</span> <span class="kw">c</span>(<span class="dv">2</span>, <span class="dv">2</span>))
+<span class="kw">plotResiduals</span>(m1)
+<span class="kw">plotResiduals</span>(m2)
+<span class="kw">plotResiduals</span>(m3)
+<span class="kw">plotResiduals</span>(m4)</code></pre></div>
+<p><img src="_main_files/figure-html/unnamed-chunk-89-1.png" width="864" /></p>
+<p>As you can see, using alpha = 0.01 reduced the number of false negatives to zero, as the acceptance limits became larger, while alpha = 0.15 gives a lot of incorrectly rejected class members. It must be noted that decreasing alpha will also lead to a larger number of false positives, which we cannot see in this case.</p>
+<div id="predictions-and-validation-with-a-test-set" class="section level3 unnumbered">
+<h3>Predictions and validation with a test set</h3>
+<p>When the model is ready, one can test it using a new test set with known classes. In this case we will use objects from all three species and be able to see how well the model performs on strangers (and calculate the specificity). In order to do that we will provide both the matrix with predictors, <code>X.t</code>, and a vector with names of the classes for the corresponding objects/rows (<code>c.t</code>). The values with known classes in this case can be:</p>
+<ul>
+<li>a vector with text values (names)</li>
+<li>a factor using the names as labels</li>
+<li>a vector with logical values (<code>TRUE</code> for class members and <code>FALSE</code> for strangers)</li>
+</ul>
+<p>In our case we have a factor. Rather than creating a new model and providing the values as a test set, we will make predictions with the existing model.</p>
+<div class="sourceCode"><pre class="sourceCode r"><code class="sourceCode r">res =<span class="st"> </span><span class="kw">predict</span>(m, X.t, c.t)
+<span class="kw">summary</span>(res)</code></pre></div>
+<pre><code>## 
+## Summary for SIMCA one-class classification result
+## 
+## Class name: versicolor
+## Number of selected components: 3
+## 
+##        Expvar Cumexpvar TP FP TN FN Spec Sens
+## Comp 1  64.27     64.27 23  5 45  2 0.90 0.92
+## Comp 2   1.67     65.95 24  3 47  1 0.94 0.96
+## Comp 3  32.45     98.40 22  3 47  3 0.94 0.88</code></pre>
+<p>In this case we see more detailed statistics with true/false positives and negatives, specificity and sensitivity. The performance statistics can also be shown as plots.</p>
+<div class="sourceCode"><pre class="sourceCode r"><code class="sourceCode r"><span class="kw">par</span>(<span class="dt">mfrow =</span> <span class="kw">c</span>(<span class="dv">2</span>, <span class="dv">2</span>))
+<span class="kw">plotSpecificity</span>(res)
+<span class="kw">plotSensitivity</span>(res)
+<span class="kw">plotMisclassified</span>(res)
+<span class="kw">plotPerformance</span>(res)</code></pre></div>
+<p><img src="_main_files/figure-html/unnamed-chunk-91-1.png" width="864" /></p>
+<p>The classification results can be shown both graphically and numerically. Here is a prediction plot for the results.</p>
+<div class="sourceCode"><pre class="sourceCode r"><code class="sourceCode r"><span class="kw">par</span>(<span class="dt">mfrow =</span> <span class="kw">c</span>(<span class="dv">2</span>, <span class="dv">1</span>))
+<span class="kw">plotPredictions</span>(res)
+<span class="kw">plotPredictions</span>(res, <span class="dt">ncomp =</span> <span class="dv">2</span>)</code></pre></div>
+<p><img src="_main_files/figure-html/unnamed-chunk-92-1.png" width="864" /></p>
+<p>So we can see that for the model with three components we have no false positives (specificity = 1) and one false negative (sensitivity = 24/25 = 0.96). You can also show the predictions as a matrix with -1 and +1 using the method <code>showPredictions()</code> or get the array with predicted class values directly as it is shown in the example below (for rows 31 to 40, different number of components and the first classification variable).</p>
+<div class="sourceCode"><pre class="sourceCode r"><code class="sourceCode r"><span class="kw">show</span>(res$c.pred[<span class="dv">31</span>:<span class="dv">40</span>, <span class="dv">1</span>:<span class="dv">3</span>, <span class="dv">1</span>])</code></pre></div>
+<pre><code>##    Comp 1 Comp 2 Comp 3
+## 62      1      1      1
+## 64      1      1      1
+## 66      1      1      1
+## 68      1      1     -1
+## 70      1      1      1
+## 72      1      1      1
+## 74      1      1     -1
+## 76      1      1      1
+## 78      1      1      1
+## 80      1      1      1</code></pre>
+</div>
+</div>
+            </section>
+
+          </div>
+        </div>
+      </div>
+<a href="simca-classification.html" class="navigation navigation-prev " aria-label="Previous page"><i class="fa fa-angle-left"></i></a>
+<a href="multiclass-classification.html" class="navigation navigation-next " aria-label="Next page"><i class="fa fa-angle-right"></i></a>
+
+<script src="libs/gitbook-2.6.7/js/app.min.js"></script>
+<script src="libs/gitbook-2.6.7/js/lunr.js"></script>
+<script src="libs/gitbook-2.6.7/js/plugin-search.js"></script>
+<script src="libs/gitbook-2.6.7/js/plugin-sharing.js"></script>
+<script src="libs/gitbook-2.6.7/js/plugin-fontsettings.js"></script>
+<script src="libs/gitbook-2.6.7/js/plugin-bookdown.js"></script>
+<script src="libs/gitbook-2.6.7/js/jquery.highlight.js"></script>
+<script>
+require(["gitbook"], function(gitbook) {
+gitbook.start({
+"sharing": {
+"facebook": true,
+"twitter": true,
+"google": false,
+"weibo": false,
+"instapper": false,
+"vk": false,
+"all": ["facebook", "google", "twitter", "weibo", "instapaper"]
+},
+"fontsettings": {
+"theme": "white",
+"family": "sans",
+"size": 1
+},
+"edit": {
+"link": null,
+"text": null
+},
+"download": null,
+"toc": {
+"collapse": "subsection"
+}
+});
+});
+</script>
+
+<!-- dynamically load mathjax for compatibility with self-contained -->
+<script>
+  (function () {
+    var script = document.createElement("script");
+    script.type = "text/javascript";
+    script.src  = "https://cdn.mathjax.org/mathjax/latest/MathJax.js?config=TeX-AMS-MML_HTMLorMML";
+    if (location.protocol !== "file:" && /^https?:/.test(script.src))
+      script.src  = script.src.replace(/^https?:/, '');
+    document.getElementsByTagName("head")[0].appendChild(script);
+  })();
+</script>
+</body>
+
+</html>
diff --git a/docs/datasets-and-plots.html b/docs/datasets-and-plots.html
index cce8827..c25f48d 100644
--- a/docs/datasets-and-plots.html
+++ b/docs/datasets-and-plots.html
@@ -25,7 +25,7 @@
 
 <meta name="author" content="Sergey Kucheryavskiy">
 
-<meta name="date" content="2016-10-16">
+<meta name="date" content="2016-10-30">
 
 <script type="text/x-mathjax-config">
 MathJax.Hub.Config({
@@ -107,7 +107,7 @@
 <ul class="summary">
 <li class="chapter" data-level="" data-path="index.html"><a href="index.html"><i class="fa fa-check"></i>Introduction</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html"><i class="fa fa-check"></i>What is new</a><ul>
-<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-to-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
+<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#last-changes-and-improvements-to-book-and-package"><i class="fa fa-check"></i>Last changes and improvements to book and package</a></li>
 </ul></li>
 <li class="chapter" data-level="" data-path="overview.html"><a href="overview.html"><i class="fa fa-check"></i>Overview</a><ul>
@@ -159,6 +159,12 @@
 </ul></li>
 <li class="chapter" data-level="" data-path="variable-selection.html"><a href="variable-selection.html"><i class="fa fa-check"></i>Variable selection</a></li>
 </ul></li>
+<li class="chapter" data-level="" data-path="simca-classification.html"><a href="simca-classification.html"><i class="fa fa-check"></i>SIMCA classification</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html"><i class="fa fa-check"></i>Calibration and validation</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html#predictions-and-validation-with-a-test-set"><i class="fa fa-check"></i>Predictions and validation with a test set</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="multiclass-classification.html"><a href="multiclass-classification.html"><i class="fa fa-check"></i>Multiclass classification</a></li>
+</ul></li>
 </ul>
 
       </nav>
diff --git a/docs/how-to-install.html b/docs/how-to-install.html
index 0e2af57..38b4f07 100644
--- a/docs/how-to-install.html
+++ b/docs/how-to-install.html
@@ -25,7 +25,7 @@
 
 <meta name="author" content="Sergey Kucheryavskiy">
 
-<meta name="date" content="2016-10-16">
+<meta name="date" content="2016-10-30">
 
 <script type="text/x-mathjax-config">
 MathJax.Hub.Config({
@@ -107,7 +107,7 @@
 <ul class="summary">
 <li class="chapter" data-level="" data-path="index.html"><a href="index.html"><i class="fa fa-check"></i>Introduction</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html"><i class="fa fa-check"></i>What is new</a><ul>
-<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-to-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
+<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#last-changes-and-improvements-to-book-and-package"><i class="fa fa-check"></i>Last changes and improvements to book and package</a></li>
 </ul></li>
 <li class="chapter" data-level="" data-path="overview.html"><a href="overview.html"><i class="fa fa-check"></i>Overview</a><ul>
@@ -159,6 +159,12 @@
 </ul></li>
 <li class="chapter" data-level="" data-path="variable-selection.html"><a href="variable-selection.html"><i class="fa fa-check"></i>Variable selection</a></li>
 </ul></li>
+<li class="chapter" data-level="" data-path="simca-classification.html"><a href="simca-classification.html"><i class="fa fa-check"></i>SIMCA classification</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html"><i class="fa fa-check"></i>Calibration and validation</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html#predictions-and-validation-with-a-test-set"><i class="fa fa-check"></i>Predictions and validation with a test set</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="multiclass-classification.html"><a href="multiclass-classification.html"><i class="fa fa-check"></i>Multiclass classification</a></li>
+</ul></li>
 </ul>
 
       </nav>
diff --git a/docs/index.html b/docs/index.html
index 52f6a7c..134f13b 100644
--- a/docs/index.html
+++ b/docs/index.html
@@ -25,7 +25,7 @@
 
 <meta name="author" content="Sergey Kucheryavskiy">
 
-<meta name="date" content="2016-10-16">
+<meta name="date" content="2016-10-30">
 
 <script type="text/x-mathjax-config">
 MathJax.Hub.Config({
@@ -107,7 +107,7 @@
 <ul class="summary">
 <li class="chapter" data-level="" data-path="index.html"><a href="index.html"><i class="fa fa-check"></i>Introduction</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html"><i class="fa fa-check"></i>What is new</a><ul>
-<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-to-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
+<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#last-changes-and-improvements-to-book-and-package"><i class="fa fa-check"></i>Last changes and improvements to book and package</a></li>
 </ul></li>
 <li class="chapter" data-level="" data-path="overview.html"><a href="overview.html"><i class="fa fa-check"></i>Overview</a><ul>
@@ -159,6 +159,12 @@
 </ul></li>
 <li class="chapter" data-level="" data-path="variable-selection.html"><a href="variable-selection.html"><i class="fa fa-check"></i>Variable selection</a></li>
 </ul></li>
+<li class="chapter" data-level="" data-path="simca-classification.html"><a href="simca-classification.html"><i class="fa fa-check"></i>SIMCA classification</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html"><i class="fa fa-check"></i>Calibration and validation</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html#predictions-and-validation-with-a-test-set"><i class="fa fa-check"></i>Predictions and validation with a test set</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="multiclass-classification.html"><a href="multiclass-classification.html"><i class="fa fa-check"></i>Multiclass classification</a></li>
+</ul></li>
 </ul>
 
       </nav>
@@ -179,7 +185,7 @@ <h1>
 <div id="header">
 <h1 class="title">Getting started with mdatools for R</h1>
 <h4 class="author"><em>Sergey Kucheryavskiy</em></h4>
-<h4 class="date"><em>October 16, 2016</em></h4>
+<h4 class="date"><em>October 30, 2016</em></h4>
 </div>
 <div id="introduction" class="section level1 unnumbered">
 <h1>Introduction</h1>
diff --git a/docs/models-and-results-1.html b/docs/models-and-results-1.html
index eeb8f98..d28b02b 100644
--- a/docs/models-and-results-1.html
+++ b/docs/models-and-results-1.html
@@ -25,7 +25,7 @@
 
 <meta name="author" content="Sergey Kucheryavskiy">
 
-<meta name="date" content="2016-10-16">
+<meta name="date" content="2016-10-30">
 
 <script type="text/x-mathjax-config">
 MathJax.Hub.Config({
@@ -107,7 +107,7 @@
 <ul class="summary">
 <li class="chapter" data-level="" data-path="index.html"><a href="index.html"><i class="fa fa-check"></i>Introduction</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html"><i class="fa fa-check"></i>What is new</a><ul>
-<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-to-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
+<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#last-changes-and-improvements-to-book-and-package"><i class="fa fa-check"></i>Last changes and improvements to book and package</a></li>
 </ul></li>
 <li class="chapter" data-level="" data-path="overview.html"><a href="overview.html"><i class="fa fa-check"></i>Overview</a><ul>
@@ -159,6 +159,12 @@
 </ul></li>
 <li class="chapter" data-level="" data-path="variable-selection.html"><a href="variable-selection.html"><i class="fa fa-check"></i>Variable selection</a></li>
 </ul></li>
+<li class="chapter" data-level="" data-path="simca-classification.html"><a href="simca-classification.html"><i class="fa fa-check"></i>SIMCA classification</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html"><i class="fa fa-check"></i>Calibration and validation</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html#predictions-and-validation-with-a-test-set"><i class="fa fa-check"></i>Predictions and validation with a test set</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="multiclass-classification.html"><a href="multiclass-classification.html"><i class="fa fa-check"></i>Multiclass classification</a></li>
+</ul></li>
 </ul>
 
       </nav>
@@ -313,7 +319,7 @@ <h3>Model validation</h3>
 <div class="sourceCode"><pre class="sourceCode r"><code class="sourceCode r">m2 =<span class="st"> </span><span class="kw">pls</span>(X.c, y.c, <span class="dv">7</span>, <span class="dt">scale =</span> T, <span class="dt">cv =</span> <span class="dv">1</span>, <span class="dt">ncomp.selcrit =</span> <span class="st">&#39;wold&#39;</span>)
 <span class="kw">show</span>(m2$ncomp.selected)</code></pre></div>
 <pre><code>## [1] 4</code></pre>
-<p>And here is the RMSE plots (they are identical of course):</p>
+<p>And here are the RMSE plots (they are identical of course):</p>
 <div class="sourceCode"><pre class="sourceCode r"><code class="sourceCode r"><span class="kw">par</span>(<span class="dt">mfrow =</span> <span class="kw">c</span>(<span class="dv">1</span>, <span class="dv">2</span>))
 <span class="kw">plotRMSE</span>(m1)
 <span class="kw">plotRMSE</span>(m2)</code></pre></div>
@@ -329,7 +335,7 @@ <h3>Model validation</h3>
 ##     X cumexpvar Y cumexpvar  RMSE Slope   Bias  RPD
 ## Cal       97.64       98.19 0.521  0.98  0e+00 7.59
 ## CV        92.90       96.22 0.753  0.98 -2e-04 5.26</code></pre>
-<p>If you want more details run <code>summury()</code> for one of the result objects.</p>
+<p>If you want more details run <code>summary()</code> for one of the result objects.</p>
 <div class="sourceCode"><pre class="sourceCode r"><code class="sourceCode r"><span class="kw">summary</span>(m1$calres)</code></pre></div>
 <pre><code>## 
 ## PLS regression results (class plsres) summary
diff --git a/docs/models-and-results.html b/docs/models-and-results.html
index 644d28c..6f57f4d 100644
--- a/docs/models-and-results.html
+++ b/docs/models-and-results.html
@@ -25,7 +25,7 @@
 
 <meta name="author" content="Sergey Kucheryavskiy">
 
-<meta name="date" content="2016-10-16">
+<meta name="date" content="2016-10-30">
 
 <script type="text/x-mathjax-config">
 MathJax.Hub.Config({
@@ -107,7 +107,7 @@
 <ul class="summary">
 <li class="chapter" data-level="" data-path="index.html"><a href="index.html"><i class="fa fa-check"></i>Introduction</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html"><i class="fa fa-check"></i>What is new</a><ul>
-<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-to-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
+<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#last-changes-and-improvements-to-book-and-package"><i class="fa fa-check"></i>Last changes and improvements to book and package</a></li>
 </ul></li>
 <li class="chapter" data-level="" data-path="overview.html"><a href="overview.html"><i class="fa fa-check"></i>Overview</a><ul>
@@ -159,6 +159,12 @@
 </ul></li>
 <li class="chapter" data-level="" data-path="variable-selection.html"><a href="variable-selection.html"><i class="fa fa-check"></i>Variable selection</a></li>
 </ul></li>
+<li class="chapter" data-level="" data-path="simca-classification.html"><a href="simca-classification.html"><i class="fa fa-check"></i>SIMCA classification</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html"><i class="fa fa-check"></i>Calibration and validation</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html#predictions-and-validation-with-a-test-set"><i class="fa fa-check"></i>Predictions and validation with a test set</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="multiclass-classification.html"><a href="multiclass-classification.html"><i class="fa fa-check"></i>Multiclass classification</a></li>
+</ul></li>
 </ul>
 
       </nav>
diff --git a/docs/multiclass-classification.html b/docs/multiclass-classification.html
new file mode 100644
index 0000000..fa236ca
--- /dev/null
+++ b/docs/multiclass-classification.html
@@ -0,0 +1,330 @@
+<!DOCTYPE html>
+<html >
+
+<head>
+
+  <meta charset="UTF-8">
+  <meta http-equiv="X-UA-Compatible" content="IE=edge">
+  <title>Getting started with mdatools for R</title>
+  <meta content="text/html; charset=UTF-8" http-equiv="Content-Type">
+  <meta name="description" content="This is a user guide for mdatools — R package for preprocessing, exploring and analysis of multivariate data. The package provides methods mostly common for Chemometrics. The general idea of the package is to collect most of the common chemometric methods and give a similar user interface for using them. So if a user knows how to make a model and visualise results for one method, he or she can easily do this for the others.">
+  <meta name="generator" content="bookdown 0.1 and GitBook 2.6.7">
+
+  <meta property="og:title" content="Getting started with mdatools for R" />
+  <meta property="og:type" content="book" />
+  
+  
+  <meta property="og:description" content="This is a user guide for mdatools — R package for preprocessing, exploring and analysis of multivariate data. The package provides methods mostly common for Chemometrics. The general idea of the package is to collect most of the common chemometric methods and give a similar user interface for using them. So if a user knows how to make a model and visualise results for one method, he or she can easily do this for the others." />
+  <meta name="github-repo" content="svkucheryavski/mdatools.bookdown" />
+
+  <meta name="twitter:card" content="summary" />
+  <meta name="twitter:title" content="Getting started with mdatools for R" />
+  
+  <meta name="twitter:description" content="This is a user guide for mdatools — R package for preprocessing, exploring and analysis of multivariate data. The package provides methods mostly common for Chemometrics. The general idea of the package is to collect most of the common chemometric methods and give a similar user interface for using them. So if a user knows how to make a model and visualise results for one method, he or she can easily do this for the others." />
+  
+
+<meta name="author" content="Sergey Kucheryavskiy">
+
+<meta name="date" content="2016-10-30">
+
+<script type="text/x-mathjax-config">
+MathJax.Hub.Config({
+  TeX: { equationNumbers: { autoNumber: "AMS" } }
+});
+</script>
+
+  <meta name="viewport" content="width=device-width, initial-scale=1">
+  <meta name="apple-mobile-web-app-capable" content="yes">
+  <meta name="apple-mobile-web-app-status-bar-style" content="black">
+  
+  
+<link rel="prev" href="calibration-and-validation.html">
+
+
+<script src="libs/jquery-2.2.3/jquery.min.js"></script>
+<link href="libs/gitbook-2.6.7/css/style.css" rel="stylesheet" />
+<link href="libs/gitbook-2.6.7/css/plugin-bookdown.css" rel="stylesheet" />
+<link href="libs/gitbook-2.6.7/css/plugin-highlight.css" rel="stylesheet" />
+<link href="libs/gitbook-2.6.7/css/plugin-search.css" rel="stylesheet" />
+<link href="libs/gitbook-2.6.7/css/plugin-fontsettings.css" rel="stylesheet" />
+
+
+
+
+
+
+
+
+
+<style type="text/css">
+div.sourceCode { overflow-x: auto; }
+table.sourceCode, tr.sourceCode, td.lineNumbers, td.sourceCode {
+  margin: 0; padding: 0; vertical-align: baseline; border: none; }
+table.sourceCode { width: 100%; line-height: 100%; }
+td.lineNumbers { text-align: right; padding-right: 4px; padding-left: 4px; color: #aaaaaa; border-right: 1px solid #aaaaaa; }
+td.sourceCode { padding-left: 5px; }
+code > span.kw { color: #007020; font-weight: bold; } /* Keyword */
+code > span.dt { color: #902000; } /* DataType */
+code > span.dv { color: #40a070; } /* DecVal */
+code > span.bn { color: #40a070; } /* BaseN */
+code > span.fl { color: #40a070; } /* Float */
+code > span.ch { color: #4070a0; } /* Char */
+code > span.st { color: #4070a0; } /* String */
+code > span.co { color: #60a0b0; font-style: italic; } /* Comment */
+code > span.ot { color: #007020; } /* Other */
+code > span.al { color: #ff0000; font-weight: bold; } /* Alert */
+code > span.fu { color: #06287e; } /* Function */
+code > span.er { color: #ff0000; font-weight: bold; } /* Error */
+code > span.wa { color: #60a0b0; font-weight: bold; font-style: italic; } /* Warning */
+code > span.cn { color: #880000; } /* Constant */
+code > span.sc { color: #4070a0; } /* SpecialChar */
+code > span.vs { color: #4070a0; } /* VerbatimString */
+code > span.ss { color: #bb6688; } /* SpecialString */
+code > span.im { } /* Import */
+code > span.va { color: #19177c; } /* Variable */
+code > span.cf { color: #007020; font-weight: bold; } /* ControlFlow */
+code > span.op { color: #666666; } /* Operator */
+code > span.bu { } /* BuiltIn */
+code > span.ex { } /* Extension */
+code > span.pp { color: #bc7a00; } /* Preprocessor */
+code > span.at { color: #7d9029; } /* Attribute */
+code > span.do { color: #ba2121; font-style: italic; } /* Documentation */
+code > span.an { color: #60a0b0; font-weight: bold; font-style: italic; } /* Annotation */
+code > span.cv { color: #60a0b0; font-weight: bold; font-style: italic; } /* CommentVar */
+code > span.in { color: #60a0b0; font-weight: bold; font-style: italic; } /* Information */
+</style>
+
+</head>
+
+<body>
+
+
+  <div class="book without-animation with-summary font-size-2 font-family-1" data-basepath=".">
+
+    <div class="book-summary">
+      <nav role="navigation">
+
+<ul class="summary">
+<li class="chapter" data-level="" data-path="index.html"><a href="index.html"><i class="fa fa-check"></i>Introduction</a></li>
+<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html"><i class="fa fa-check"></i>What is new</a><ul>
+<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
+<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#last-changes-and-improvements-to-book-and-package"><i class="fa fa-check"></i>Last changes and improvements to book and package</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="overview.html"><a href="overview.html"><i class="fa fa-check"></i>Overview</a><ul>
+<li class="chapter" data-level="" data-path="what-mdatools-can-do.html"><a href="what-mdatools-can-do.html"><i class="fa fa-check"></i>What mdatools can do?</a></li>
+<li class="chapter" data-level="" data-path="how-to-install.html"><a href="how-to-install.html"><i class="fa fa-check"></i>How to install</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="datasets-and-plots.html"><a href="datasets-and-plots.html"><i class="fa fa-check"></i>Datasets and plots</a><ul>
+<li class="chapter" data-level="" data-path="attributes-and-factors.html"><a href="attributes-and-factors.html"><i class="fa fa-check"></i>Attributes and factors</a><ul>
+<li class="chapter" data-level="" data-path="attributes-and-factors.html"><a href="attributes-and-factors.html#package-specific-attributes"><i class="fa fa-check"></i>Package specific attributes</a></li>
+<li class="chapter" data-level="" data-path="attributes-and-factors.html"><a href="attributes-and-factors.html#attributes-for-plots"><i class="fa fa-check"></i>Attributes for plots</a></li>
+<li class="chapter" data-level="" data-path="attributes-and-factors.html"><a href="attributes-and-factors.html#special-methods-for-data-transformations"><i class="fa fa-check"></i>Special methods for data transformations</a></li>
+<li class="chapter" data-level="" data-path="attributes-and-factors.html"><a href="attributes-and-factors.html#data-frames-with-factors"><i class="fa fa-check"></i>Data frames with factors</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="simple-plots.html"><a href="simple-plots.html"><i class="fa fa-check"></i>Simple plots</a><ul>
+<li class="chapter" data-level="" data-path="simple-plots.html"><a href="simple-plots.html#scatter-plots"><i class="fa fa-check"></i>Scatter plots</a></li>
+<li class="chapter" data-level="" data-path="simple-plots.html"><a href="simple-plots.html#line-plots"><i class="fa fa-check"></i>Line plots</a></li>
+<li class="chapter" data-level="" data-path="simple-plots.html"><a href="simple-plots.html#bar-and-errorbar-plots"><i class="fa fa-check"></i>Bar and errorbar plots</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="plots-for-groups-of-objects.html"><a href="plots-for-groups-of-objects.html"><i class="fa fa-check"></i>Plots for groups of objects</a><ul>
+<li class="chapter" data-level="" data-path="plots-for-groups-of-objects.html"><a href="plots-for-groups-of-objects.html#one-matrix-or-data-frame"><i class="fa fa-check"></i>One matrix or data frame</a></li>
+<li class="chapter" data-level="" data-path="plots-for-groups-of-objects.html"><a href="plots-for-groups-of-objects.html#list-with-matrices-or-data-frames"><i class="fa fa-check"></i>List with matrices or data frames</a></li>
+<li class="chapter" data-level="" data-path="plots-for-groups-of-objects.html"><a href="plots-for-groups-of-objects.html#use-factors-to-split-a-dataset-into-groups"><i class="fa fa-check"></i>Use factors to split a dataset into groups</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="working-with-images.html"><a href="working-with-images.html"><i class="fa fa-check"></i>Working with images</a></li>
+<li class="chapter" data-level="" data-path="preprocessing.html"><a href="preprocessing.html"><i class="fa fa-check"></i>Preprocessing</a><ul>
+<li class="chapter" data-level="" data-path="preprocessing.html"><a href="preprocessing.html#autoscaling"><i class="fa fa-check"></i>Autoscaling</a></li>
+<li class="chapter" data-level="" data-path="preprocessing.html"><a href="preprocessing.html#correction-of-spectral-baseline"><i class="fa fa-check"></i>Correction of spectral baseline</a></li>
+<li class="chapter" data-level="" data-path="preprocessing.html"><a href="preprocessing.html#smoothing-and-derivatives"><i class="fa fa-check"></i>Smoothing and derivatives</a></li>
+</ul></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="principal-component-analysis.html"><a href="principal-component-analysis.html"><i class="fa fa-check"></i>Principal component analysis</a><ul>
+<li class="chapter" data-level="" data-path="models-and-results.html"><a href="models-and-results.html"><i class="fa fa-check"></i>Models and results</a><ul>
+<li class="chapter" data-level="" data-path="models-and-results.html"><a href="models-and-results.html#model-calibration"><i class="fa fa-check"></i>Model calibration</a></li>
+<li class="chapter" data-level="" data-path="models-and-results.html"><a href="models-and-results.html#model-validation"><i class="fa fa-check"></i>Model validation</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="plotting-methods.html"><a href="plotting-methods.html"><i class="fa fa-check"></i>Plotting methods</a><ul>
+<li class="chapter" data-level="" data-path="plotting-methods.html"><a href="plotting-methods.html#support-for-images"><i class="fa fa-check"></i>Support for images</a></li>
+<li class="chapter" data-level="" data-path="plotting-methods.html"><a href="plotting-methods.html#manual-x-values-for-loading-line-plot"><i class="fa fa-check"></i>Manual x-values for loading line plot</a></li>
+<li class="chapter" data-level="" data-path="plotting-methods.html"><a href="plotting-methods.html#excluding-rows-and-columns"><i class="fa fa-check"></i>Excluding rows and columns</a></li>
+</ul></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="partial-least-squares-regression.html"><a href="partial-least-squares-regression.html"><i class="fa fa-check"></i>Partial least squares regression</a><ul>
+<li class="chapter" data-level="" data-path="models-and-results-1.html"><a href="models-and-results-1.html"><i class="fa fa-check"></i>Models and results</a><ul>
+<li class="chapter" data-level="" data-path="models-and-results-1.html"><a href="models-and-results-1.html#model-calibration-1"><i class="fa fa-check"></i>Model calibration</a></li>
+<li class="chapter" data-level="" data-path="models-and-results-1.html"><a href="models-and-results-1.html#model-validation-1"><i class="fa fa-check"></i>Model validation</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="plotting-methods-1.html"><a href="plotting-methods-1.html"><i class="fa fa-check"></i>Plotting methods</a><ul>
+<li class="chapter" data-level="" data-path="plotting-methods-1.html"><a href="plotting-methods-1.html#excluding-rows-and-columns-1"><i class="fa fa-check"></i>Excluding rows and columns</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="variable-selection.html"><a href="variable-selection.html"><i class="fa fa-check"></i>Variable selection</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="simca-classification.html"><a href="simca-classification.html"><i class="fa fa-check"></i>SIMCA classification</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html"><i class="fa fa-check"></i>Calibration and validation</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html#predictions-and-validation-with-a-test-set"><i class="fa fa-check"></i>Predictions and validation with a test set</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="multiclass-classification.html"><a href="multiclass-classification.html"><i class="fa fa-check"></i>Multiclass classification</a></li>
+</ul></li>
+</ul>
+
+      </nav>
+    </div>
+
+    <div class="book-body">
+      <div class="body-inner">
+        <div class="book-header" role="navigation">
+          <h1>
+            <i class="fa fa-circle-o-notch fa-spin"></i><a href="./">Getting started with mdatools for R</a>
+          </h1>
+        </div>
+
+        <div class="page-wrapper" tabindex="-1" role="main">
+          <div class="page-inner">
+
+            <section class="normal" id="section-">
+<div id="multiclass-classification" class="section level2 unnumbered">
+<h2>Multiclass classification</h2>
+<p>Several SIMCA models can be combined into a special object, <code>simcam</code>, which is used for multiclass classification. In addition, it allows calculating the distance between individual models and the discrimination power — the importance of each variable for discriminating between any two classes. Let’s see how it works.</p>
+<p>First we create three single-class SIMCA models with individual settings, such as the optimal number of components and the significance level (alpha).</p>
+<div class="sourceCode"><pre class="sourceCode r"><code class="sourceCode r">m.set =<span class="st"> </span><span class="kw">simca</span>(X.set, <span class="st">&#39;setosa&#39;</span>, <span class="dv">3</span>, <span class="dt">alpha =</span> <span class="fl">0.01</span>)
+m.set =<span class="st"> </span><span class="kw">selectCompNum</span>(m.set, <span class="dv">1</span>)
+
+m.vir =<span class="st"> </span><span class="kw">simca</span>(X.vir, <span class="st">&#39;virginica&#39;</span>, <span class="dv">3</span>)
+m.vir =<span class="st"> </span><span class="kw">selectCompNum</span>(m.vir, <span class="dv">2</span>)
+
+m.ver =<span class="st"> </span><span class="kw">simca</span>(X.ver, <span class="st">&#39;versicola&#39;</span>, <span class="dv">3</span>)
+m.ver =<span class="st"> </span><span class="kw">selectCompNum</span>(m.ver, <span class="dv">1</span>)</code></pre></div>
+<p>Then we combine the models into a SIMCAM model object. The summary shows the performance on the calibration set, which is a combination of the calibration sets of the individual models.</p>
+<div class="sourceCode"><pre class="sourceCode r"><code class="sourceCode r">m =<span class="st"> </span><span class="kw">simcam</span>(<span class="kw">list</span>(m.set, m.vir, m.ver))
+<span class="kw">summary</span>(m)</code></pre></div>
+<pre><code>## 
+## SIMCA multiple classes classification (class simcam)
+## Nmber of classes: 3
+## Info: 
+## 
+## SIMCA model for class &quot;setosa&quot; summary
+## 
+## Info: 
+## Significance level (alpha): 0.01
+## Selected number of components: 1
+## 
+##        Expvar Cumexpvar Sens (cal)
+## Comp 1  73.51     73.51          1
+## Comp 2  14.24     87.76          1
+## Comp 3  10.44     98.20          1
+## 
+## SIMCA model for class &quot;virginica&quot; summary
+## 
+## Info: 
+## Significance level (alpha): 0.05
+## Selected number of components: 2
+## 
+##        Expvar Cumexpvar Sens (cal)
+## Comp 1  76.16     76.16       0.88
+## Comp 2  14.94     91.10       1.00
+## Comp 3   6.09     97.20       0.96
+## 
+## SIMCA model for class &quot;versicola&quot; summary
+## 
+## Info: 
+## Significance level (alpha): 0.05
+## Selected number of components: 1
+## 
+##        Expvar Cumexpvar Sens (cal)
+## Comp 1  76.44     76.44       0.96
+## Comp 2  13.93     90.37       0.92
+## Comp 3   8.45     98.82       0.92</code></pre>
+<p>Now we apply the combined model to the test set and look at the predictions.</p>
+<div class="sourceCode"><pre class="sourceCode r"><code class="sourceCode r">res =<span class="st"> </span><span class="kw">predict</span>(m, X.t, c.t)
+<span class="kw">plotPredictions</span>(res)</code></pre></div>
+<p><img src="_main_files/figure-html/unnamed-chunk-95-1.png" width="864" /></p>
+<p>In this case the predictions are shown only for the number of components selected as optimal for each model. The class names along the y-axis correspond to the individual models. Similarly, we can show the predicted values.</p>
+<div class="sourceCode"><pre class="sourceCode r"><code class="sourceCode r"><span class="kw">show</span>(res$c.pred[<span class="dv">20</span>:<span class="dv">30</span>, <span class="dv">1</span>, <span class="dv">1</span>:<span class="dv">3</span>])</code></pre></div>
+<pre><code>##    setosa virginica versicola
+## 40      1        -1        -1
+## 42     -1        -1        -1
+## 44      1        -1        -1
+## 46      1        -1        -1
+## 48      1        -1        -1
+## 50      1        -1        -1
+## 52     -1        -1         1
+## 54     -1        -1         1
+## 56     -1         1         1
+## 58     -1        -1        -1
+## 60     -1        -1         1</code></pre>
+<p>There are three additional plots available for a multiclass SIMCA model. The first one shows the distance between a selected model and the others.</p>
+<div class="sourceCode"><pre class="sourceCode r"><code class="sourceCode r"><span class="kw">par</span>(<span class="dt">mfrow =</span> <span class="kw">c</span>(<span class="dv">1</span>, <span class="dv">2</span>))
+<span class="kw">plotModelDistance</span>(m, <span class="dv">1</span>)
+<span class="kw">plotModelDistance</span>(m, <span class="dv">2</span>)</code></pre></div>
+<p><img src="_main_files/figure-html/unnamed-chunk-97-1.png" width="864" /></p>
+<p>The second plot shows the discrimination power, mentioned at the beginning of the section.</p>
+<div class="sourceCode"><pre class="sourceCode r"><code class="sourceCode r"><span class="kw">par</span>(<span class="dt">mfrow =</span> <span class="kw">c</span>(<span class="dv">1</span>, <span class="dv">2</span>))
+<span class="kw">plotDiscriminationPower</span>(m, <span class="kw">c</span>(<span class="dv">1</span>, <span class="dv">3</span>), <span class="dt">show.labels =</span> T)
+<span class="kw">plotDiscriminationPower</span>(m, <span class="kw">c</span>(<span class="dv">2</span>, <span class="dv">3</span>), <span class="dt">show.labels =</span> T)</code></pre></div>
+<p><img src="_main_files/figure-html/unnamed-chunk-98-1.png" width="864" /></p>
+<p>And, finally, the Cooman’s plot shows the orthogonal distance from objects to two selected classes/models.</p>
+<div class="sourceCode"><pre class="sourceCode r"><code class="sourceCode r"><span class="kw">par</span>(<span class="dt">mfrow =</span> <span class="kw">c</span>(<span class="dv">1</span>, <span class="dv">2</span>))
+<span class="kw">plotCooman</span>(m, <span class="kw">c</span>(<span class="dv">1</span>, <span class="dv">3</span>), <span class="dt">show.labels =</span> T)
+<span class="kw">plotCooman</span>(m, <span class="kw">c</span>(<span class="dv">2</span>, <span class="dv">3</span>), <span class="dt">show.labels =</span> T)</code></pre></div>
+<p><img src="_main_files/figure-html/unnamed-chunk-99-1.png" width="864" /></p>
+
+</div>
+<!-- </div> -->
+            </section>
+
+          </div>
+        </div>
+      </div>
+<a href="calibration-and-validation.html" class="navigation navigation-prev navigation-unique" aria-label="Previous page"><i class="fa fa-angle-left"></i></a>
+
+
+<script src="libs/gitbook-2.6.7/js/app.min.js"></script>
+<script src="libs/gitbook-2.6.7/js/lunr.js"></script>
+<script src="libs/gitbook-2.6.7/js/plugin-search.js"></script>
+<script src="libs/gitbook-2.6.7/js/plugin-sharing.js"></script>
+<script src="libs/gitbook-2.6.7/js/plugin-fontsettings.js"></script>
+<script src="libs/gitbook-2.6.7/js/plugin-bookdown.js"></script>
+<script src="libs/gitbook-2.6.7/js/jquery.highlight.js"></script>
+<script>
+require(["gitbook"], function(gitbook) {
+gitbook.start({
+"sharing": {
+"facebook": true,
+"twitter": true,
+"google": false,
+"weibo": false,
+"instapper": false,
+"vk": false,
+"all": ["facebook", "google", "twitter", "weibo", "instapaper"]
+},
+"fontsettings": {
+"theme": "white",
+"family": "sans",
+"size": 1
+},
+"edit": {
+"link": null,
+"text": null
+},
+"download": null,
+"toc": {
+"collapse": "subsection"
+}
+});
+});
+</script>
+
+<!-- dynamically load mathjax for compatibility with self-contained -->
+<script>
+  (function () {
+    var script = document.createElement("script");
+    script.type = "text/javascript";
+    script.src  = "https://cdn.mathjax.org/mathjax/latest/MathJax.js?config=TeX-AMS-MML_HTMLorMML";
+    if (location.protocol !== "file:" && /^https?:/.test(script.src))
+      script.src  = script.src.replace(/^https?:/, '');
+    document.getElementsByTagName("head")[0].appendChild(script);
+  })();
+</script>
+</body>
+
+</html>
diff --git a/docs/overview.html b/docs/overview.html
index ce1153d..468a799 100644
--- a/docs/overview.html
+++ b/docs/overview.html
@@ -25,7 +25,7 @@
 
 <meta name="author" content="Sergey Kucheryavskiy">
 
-<meta name="date" content="2016-10-16">
+<meta name="date" content="2016-10-30">
 
 <script type="text/x-mathjax-config">
 MathJax.Hub.Config({
@@ -107,7 +107,7 @@
 <ul class="summary">
 <li class="chapter" data-level="" data-path="index.html"><a href="index.html"><i class="fa fa-check"></i>Introduction</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html"><i class="fa fa-check"></i>What is new</a><ul>
-<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-to-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
+<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#last-changes-and-improvements-to-book-and-package"><i class="fa fa-check"></i>Last changes and improvements to book and package</a></li>
 </ul></li>
 <li class="chapter" data-level="" data-path="overview.html"><a href="overview.html"><i class="fa fa-check"></i>Overview</a><ul>
@@ -159,6 +159,12 @@
 </ul></li>
 <li class="chapter" data-level="" data-path="variable-selection.html"><a href="variable-selection.html"><i class="fa fa-check"></i>Variable selection</a></li>
 </ul></li>
+<li class="chapter" data-level="" data-path="simca-classification.html"><a href="simca-classification.html"><i class="fa fa-check"></i>SIMCA classification</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html"><i class="fa fa-check"></i>Calibration and validation</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html#predictions-and-validation-with-a-test-set"><i class="fa fa-check"></i>Predictions and validation with a test set</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="multiclass-classification.html"><a href="multiclass-classification.html"><i class="fa fa-check"></i>Multiclass classification</a></li>
+</ul></li>
 </ul>
 
       </nav>
diff --git a/docs/partial-least-squares-regression.html b/docs/partial-least-squares-regression.html
index 6cfb578..e36ae89 100644
--- a/docs/partial-least-squares-regression.html
+++ b/docs/partial-least-squares-regression.html
@@ -25,7 +25,7 @@
 
 <meta name="author" content="Sergey Kucheryavskiy">
 
-<meta name="date" content="2016-10-16">
+<meta name="date" content="2016-10-30">
 
 <script type="text/x-mathjax-config">
 MathJax.Hub.Config({
@@ -107,7 +107,7 @@
 <ul class="summary">
 <li class="chapter" data-level="" data-path="index.html"><a href="index.html"><i class="fa fa-check"></i>Introduction</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html"><i class="fa fa-check"></i>What is new</a><ul>
-<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-to-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
+<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#last-changes-and-improvements-to-book-and-package"><i class="fa fa-check"></i>Last changes and improvements to book and package</a></li>
 </ul></li>
 <li class="chapter" data-level="" data-path="overview.html"><a href="overview.html"><i class="fa fa-check"></i>Overview</a><ul>
@@ -159,6 +159,12 @@
 </ul></li>
 <li class="chapter" data-level="" data-path="variable-selection.html"><a href="variable-selection.html"><i class="fa fa-check"></i>Variable selection</a></li>
 </ul></li>
+<li class="chapter" data-level="" data-path="simca-classification.html"><a href="simca-classification.html"><i class="fa fa-check"></i>SIMCA classification</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html"><i class="fa fa-check"></i>Calibration and validation</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html#predictions-and-validation-with-a-test-set"><i class="fa fa-check"></i>Predictions and validation with a test set</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="multiclass-classification.html"><a href="multiclass-classification.html"><i class="fa fa-check"></i>Multiclass classification</a></li>
+</ul></li>
 </ul>
 
       </nav>
diff --git a/docs/plots-for-groups-of-objects.html b/docs/plots-for-groups-of-objects.html
index 935be01..b4b5728 100644
--- a/docs/plots-for-groups-of-objects.html
+++ b/docs/plots-for-groups-of-objects.html
@@ -25,7 +25,7 @@
 
 <meta name="author" content="Sergey Kucheryavskiy">
 
-<meta name="date" content="2016-10-16">
+<meta name="date" content="2016-10-30">
 
 <script type="text/x-mathjax-config">
 MathJax.Hub.Config({
@@ -107,7 +107,7 @@
 <ul class="summary">
 <li class="chapter" data-level="" data-path="index.html"><a href="index.html"><i class="fa fa-check"></i>Introduction</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html"><i class="fa fa-check"></i>What is new</a><ul>
-<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-to-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
+<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#last-changes-and-improvements-to-book-and-package"><i class="fa fa-check"></i>Last changes and improvements to book and package</a></li>
 </ul></li>
 <li class="chapter" data-level="" data-path="overview.html"><a href="overview.html"><i class="fa fa-check"></i>Overview</a><ul>
@@ -159,6 +159,12 @@
 </ul></li>
 <li class="chapter" data-level="" data-path="variable-selection.html"><a href="variable-selection.html"><i class="fa fa-check"></i>Variable selection</a></li>
 </ul></li>
+<li class="chapter" data-level="" data-path="simca-classification.html"><a href="simca-classification.html"><i class="fa fa-check"></i>SIMCA classification</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html"><i class="fa fa-check"></i>Calibration and validation</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html#predictions-and-validation-with-a-test-set"><i class="fa fa-check"></i>Predictions and validation with a test set</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="multiclass-classification.html"><a href="multiclass-classification.html"><i class="fa fa-check"></i>Multiclass classification</a></li>
+</ul></li>
 </ul>
 
       </nav>
diff --git a/docs/plotting-methods-1.html b/docs/plotting-methods-1.html
index 11c04f4..246f7eb 100644
--- a/docs/plotting-methods-1.html
+++ b/docs/plotting-methods-1.html
@@ -25,7 +25,7 @@
 
 <meta name="author" content="Sergey Kucheryavskiy">
 
-<meta name="date" content="2016-10-16">
+<meta name="date" content="2016-10-30">
 
 <script type="text/x-mathjax-config">
 MathJax.Hub.Config({
@@ -107,7 +107,7 @@
 <ul class="summary">
 <li class="chapter" data-level="" data-path="index.html"><a href="index.html"><i class="fa fa-check"></i>Introduction</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html"><i class="fa fa-check"></i>What is new</a><ul>
-<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-to-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
+<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#last-changes-and-improvements-to-book-and-package"><i class="fa fa-check"></i>Last changes and improvements to book and package</a></li>
 </ul></li>
 <li class="chapter" data-level="" data-path="overview.html"><a href="overview.html"><i class="fa fa-check"></i>Overview</a><ul>
@@ -159,6 +159,12 @@
 </ul></li>
 <li class="chapter" data-level="" data-path="variable-selection.html"><a href="variable-selection.html"><i class="fa fa-check"></i>Variable selection</a></li>
 </ul></li>
+<li class="chapter" data-level="" data-path="simca-classification.html"><a href="simca-classification.html"><i class="fa fa-check"></i>SIMCA classification</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html"><i class="fa fa-check"></i>Calibration and validation</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html#predictions-and-validation-with-a-test-set"><i class="fa fa-check"></i>Predictions and validation with a test set</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="multiclass-classification.html"><a href="multiclass-classification.html"><i class="fa fa-check"></i>Multiclass classification</a></li>
+</ul></li>
 </ul>
 
       </nav>
diff --git a/docs/plotting-methods.html b/docs/plotting-methods.html
index b480575..589c203 100644
--- a/docs/plotting-methods.html
+++ b/docs/plotting-methods.html
@@ -25,7 +25,7 @@
 
 <meta name="author" content="Sergey Kucheryavskiy">
 
-<meta name="date" content="2016-10-16">
+<meta name="date" content="2016-10-30">
 
 <script type="text/x-mathjax-config">
 MathJax.Hub.Config({
@@ -107,7 +107,7 @@
 <ul class="summary">
 <li class="chapter" data-level="" data-path="index.html"><a href="index.html"><i class="fa fa-check"></i>Introduction</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html"><i class="fa fa-check"></i>What is new</a><ul>
-<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-to-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
+<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#last-changes-and-improvements-to-book-and-package"><i class="fa fa-check"></i>Last changes and improvements to book and package</a></li>
 </ul></li>
 <li class="chapter" data-level="" data-path="overview.html"><a href="overview.html"><i class="fa fa-check"></i>Overview</a><ul>
@@ -159,6 +159,12 @@
 </ul></li>
 <li class="chapter" data-level="" data-path="variable-selection.html"><a href="variable-selection.html"><i class="fa fa-check"></i>Variable selection</a></li>
 </ul></li>
+<li class="chapter" data-level="" data-path="simca-classification.html"><a href="simca-classification.html"><i class="fa fa-check"></i>SIMCA classification</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html"><i class="fa fa-check"></i>Calibration and validation</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html#predictions-and-validation-with-a-test-set"><i class="fa fa-check"></i>Predictions and validation with a test set</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="multiclass-classification.html"><a href="multiclass-classification.html"><i class="fa fa-check"></i>Multiclass classification</a></li>
+</ul></li>
 </ul>
 
       </nav>
diff --git a/docs/preprocessing.html b/docs/preprocessing.html
index f0344a9..cd40cf5 100644
--- a/docs/preprocessing.html
+++ b/docs/preprocessing.html
@@ -25,7 +25,7 @@
 
 <meta name="author" content="Sergey Kucheryavskiy">
 
-<meta name="date" content="2016-10-16">
+<meta name="date" content="2016-10-30">
 
 <script type="text/x-mathjax-config">
 MathJax.Hub.Config({
@@ -107,7 +107,7 @@
 <ul class="summary">
 <li class="chapter" data-level="" data-path="index.html"><a href="index.html"><i class="fa fa-check"></i>Introduction</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html"><i class="fa fa-check"></i>What is new</a><ul>
-<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-to-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
+<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#last-changes-and-improvements-to-book-and-package"><i class="fa fa-check"></i>Last changes and improvements to book and package</a></li>
 </ul></li>
 <li class="chapter" data-level="" data-path="overview.html"><a href="overview.html"><i class="fa fa-check"></i>Overview</a><ul>
@@ -159,6 +159,12 @@
 </ul></li>
 <li class="chapter" data-level="" data-path="variable-selection.html"><a href="variable-selection.html"><i class="fa fa-check"></i>Variable selection</a></li>
 </ul></li>
+<li class="chapter" data-level="" data-path="simca-classification.html"><a href="simca-classification.html"><i class="fa fa-check"></i>SIMCA classification</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html"><i class="fa fa-check"></i>Calibration and validation</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html#predictions-and-validation-with-a-test-set"><i class="fa fa-check"></i>Predictions and validation with a test set</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="multiclass-classification.html"><a href="multiclass-classification.html"><i class="fa fa-check"></i>Multiclass classification</a></li>
+</ul></li>
 </ul>
 
       </nav>
diff --git a/docs/principal-component-analysis.html b/docs/principal-component-analysis.html
index f5a4b60..e00a5df 100644
--- a/docs/principal-component-analysis.html
+++ b/docs/principal-component-analysis.html
@@ -25,7 +25,7 @@
 
 <meta name="author" content="Sergey Kucheryavskiy">
 
-<meta name="date" content="2016-10-16">
+<meta name="date" content="2016-10-30">
 
 <script type="text/x-mathjax-config">
 MathJax.Hub.Config({
@@ -107,7 +107,7 @@
 <ul class="summary">
 <li class="chapter" data-level="" data-path="index.html"><a href="index.html"><i class="fa fa-check"></i>Introduction</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html"><i class="fa fa-check"></i>What is new</a><ul>
-<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-to-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
+<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#last-changes-and-improvements-to-book-and-package"><i class="fa fa-check"></i>Last changes and improvements to book and package</a></li>
 </ul></li>
 <li class="chapter" data-level="" data-path="overview.html"><a href="overview.html"><i class="fa fa-check"></i>Overview</a><ul>
@@ -159,6 +159,12 @@
 </ul></li>
 <li class="chapter" data-level="" data-path="variable-selection.html"><a href="variable-selection.html"><i class="fa fa-check"></i>Variable selection</a></li>
 </ul></li>
+<li class="chapter" data-level="" data-path="simca-classification.html"><a href="simca-classification.html"><i class="fa fa-check"></i>SIMCA classification</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html"><i class="fa fa-check"></i>Calibration and validation</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html#predictions-and-validation-with-a-test-set"><i class="fa fa-check"></i>Predictions and validation with a test set</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="multiclass-classification.html"><a href="multiclass-classification.html"><i class="fa fa-check"></i>Multiclass classification</a></li>
+</ul></li>
 </ul>
 
       </nav>
diff --git a/docs/search_index.json b/docs/search_index.json
index 0207df3..d72e67f 100644
--- a/docs/search_index.json
+++ b/docs/search_index.json
@@ -1,6 +1,6 @@
 [
-["index.html", "Getting started with mdatools for R Introduction", " Getting started with mdatools for R Sergey Kucheryavskiy October 16, 2016 Introduction This is a user guide for mdatools — R package for preprocessing, exploring and analysis of multivariate data. The package provides methods mostly common for Chemometrics. The general idea of the package is to collect the popular chemometric methods and give a similar “user interface” for using them. So if a user knows how to make a model and visualize results for one method, he or she can easily do this for the other methods as well. I decided to rewrite this tutorial in order to add more details and examples for the implemented methods. This is a pre-release version and I am still working on it. So far it only presents how to work with datasets and plots as well as describes in details how to do PCA analysis and PLS regression. More chapters (classification, interval PLS, etc) will be available soon. You can track main changes in the text here. All methods implemented in the package were tested using well-known datasets. However, there still could be some bugs, in this case please report to svkucheryavski@gmail.com or use Issues tool at GitHub. You are also very welcome to share your comments and suggestions about the package functionality. "],
-["what-is-new.html", "What is new", " What is new What to expect from future releases Book Chapters about classification (SIMCA, SIMCA for multiple classes, PLS-DA) Chapter about interval PLS (iPLS) Chapter about randomization test (randtest) Package Implementation of MCR-ALS and purity based method for curve resolution Possibility to combine preprocessing methods into an object and provide it to a model Randomized algorithms to work with big data faster GUI for interactive modelling Last changes and improvements to book and package 14.10.2016 The new version (0.8.0) brings a lot of new features, therefore it was decided to rewrite this tutorial completely and start this log from the scratch. Most of the things available in the previous version of the package will work without any changes. But if you have been using functions mdaplot() and mdaplotg() it makes sense to read how the new implementation works and rewrite your code. The use of plotting tools became much simpler and more efficient. The main changes in the package are: added a possibility to assign specific attributes to datasets, which makes plotting easier. added a possibility to exclude (hide) selected rows and columns when create a model. if a data frame has factor columns they will be automatically converted to a set of dummy variables. added several functions to make the operations with datasets containing specific attributes easier. plotting tools (mdaplot(), mdaplotg()) were rewritten to make the use of them easier and more efficient scores and loadings plots now show a percent of explained variance biplot is now available for PCA models (plotBiplot) added support for images, see a specific chapter for details cross-validation procedures were optimized for most of the methods and now takes less time several bug fixes and small improvements Besides that, the tutorial is now available in docs folder of the package repository in GitHub. 
The tutorial is a static HTML site, which can be used locally without internet connection (start with index.html). However, it is not available from CRAN repository due to CRAN limitations. You can also access the tutorial via GitHub Pages "],
+["index.html", "Getting started with mdatools for R Introduction", " Getting started with mdatools for R Sergey Kucheryavskiy October 30, 2016 Introduction This is a user guide for mdatools — R package for preprocessing, exploring and analysis of multivariate data. The package provides methods mostly common for Chemometrics. The general idea of the package is to collect the popular chemometric methods and give a similar “user interface” for using them. So if a user knows how to make a model and visualize results for one method, he or she can easily do this for the other methods as well. I decided to rewrite this tutorial in order to add more details and examples for the implemented methods. This is a pre-release version and I am still working on it. So far it only presents how to work with datasets and plots as well as describes in details how to do PCA analysis and PLS regression. More chapters (classification, interval PLS, etc) will be available soon. You can track main changes in the text here. All methods implemented in the package were tested using well-known datasets. However, there still could be some bugs, in this case please report to svkucheryavski@gmail.com or use Issues tool at GitHub. You are also very welcome to share your comments and suggestions about the package functionality. "],
+["what-is-new.html", "What is new", " What is new What expect from future releases Book Chapters about classification (SIMCA, SIMCA for multiple classes, PLS-DA) Chapter about interval PLS (iPLS) Chapter about randomization test (randtest) Package Implementation of MCR-ALS and purity based method for curve resolution Possibility to combine preprocessing methods into an object and provide it to a model Randomized algorithms to work with big data faster GUI for interactive modelling Last changes and improvements to book and package 30.10.2016 fixed a bug in PCA when explained variance was calculated incorrectly for data with excluded rows fixed several issues with SIMCA (cross-validation) and SIMCAM (Cooman’s plot) added a chapter about SIMCA to the tutorial 14.10.2016 The new version (0.8.0) brings a lot of new features, therefore it was decided to rewrite this tutorial completely and start this log from the scratch. Most of the things available in the previous version of the package will work without any changes. But if you have been using functions mdaplot() and mdaplotg() it makes sense to read how the new implementation works and rewrite your code. The use of plotting tools became much simpler and more efficient. The main changes in the package are: added a possibility to assign specific attributes to datasets, which makes plotting easier. added a possibility to exclude (hide) selected rows and columns when create a model. if a data frame has factor columns they will be automatically converted to a set of dummy variables. added several functions to make the operations with datasets containing specific attributes easier. 
plotting tools (mdaplot(), mdaplotg()) were rewritten to make the use of them easier and more efficient scores and loadings plots now show a percent of explained variance biplot is now available for PCA models (plotBiplot) added support for images, see a specific chapter for details cross-validation procedures were optimized for most of the methods and now take less time several bug fixes and small improvements Besides that, the tutorial is now available in the docs folder of the package repository in GitHub. The tutorial is a static HTML site, which can be used locally without internet connection (start with index.html). However, it is not available from the CRAN repository due to CRAN limitations. You can also access the tutorial via GitHub Pages "],
 ["overview.html", "Overview", " Overview This package was created for an introductory PhD course on Chemometrics given at Department of Chemistry and Bioscience, Aalborg University. Quickly I found out that using R for this course (with all advantages it gives) needs a lot of routine work from students, since most of them were also beginners in R. Of course it is very good for understanding when students get to know e.g. how to calculate explained variance or residuals in PCA manually or make corresponding plots and so on, but for the introductory course these things (as well as numerous typos and small mistakes in a code) take too much time, which can be spent for explaining methods and proper interpretation of results. This is actually also true for everyday using of these methods, most of the routines can be written ones and simply reused with various options. So it was decided to write a package where most widely used chemometric methods for multivariate data analysis are implemented and which gives also a quick and easy-to-use access to results, produced by these methods. First of all numerous plots. Here how it works. Say, we need to make a PCA model for data matrix x with autoscaling. Then make an overview of most important plots and investigate scores and loadings for first three components. The mdatools solution will be: # make a model for autoscaled data with maximum possible number of components m = pca(x, scale = TRUE) # show explained variance plot plotVariance(m) # select optimal number of components (say, 4) for correct calculation of residuals m = selectCompNum(m, 4) # show plots for model overview plot(m) # show scores plot for PC1 and PC3 plotScores(m, c(1, 3)) # show loadings plot for the same components plotLoadings(m, c(1, 3)) # show the loadings as a set of bar plots plotLoadings(m, c(1, 3), type = &#39;h&#39;) Fairly simple, is not it? 
The other “routine”, which have been taken into account is validation — any model can be cross-validated or validated with a test set. The model object will contain the validation results, which will also appear on all model plots, etc. See the next chapters for details. "],
 ["what-mdatools-can-do.html", "What mdatools can do?", " What mdatools can do? The package includes classes and functions for analysis, preprocessing and plotting data and results. So far the following methods for analysis are implemented: Principal Component Analysis (PCA) Soft Independent Modelling of Class Analogy (SIMCA) Partial Least Squares regression (PLS) with calculation of VIP scores and Selectivity ratio Partial Least Squares Discriminant Analysis (PLS-DA) Randomization test for PLS regression models Interval PLS for variable selection Preprocessing methods include: Mean centering, standardization and autoscaling Savitzky-Golay filter for smoothing and derivatives Standard Normal Variate for removing scatter effect from spectral data Mutliplicative Scatter Correction for the same issue Normalization of spectra to unit area or unit length Besides that, some extensions for the basic R plotting functionality have been also implemented and allow to do the following: Color grouping of objects with automatic color legend bar. Plot for several groups of objects with automatically calculated axes limits and plot legend. Three built-in color schemes — one is based on Colorbrewer and the other two are jet and grayscale. Very easy-to-use possibility to apply any user defined color scheme. Possibility to show horizontal and vertical lines on the plot with automatically adjusted axes limits. Possibility to extend plotting functionality by using some attributes for datasets. See ?mdatools and next chapters for more details. "],
 ["how-to-install.html", "How to install", " How to install The package is available from CRAN by usual installing procedure. However due to restrictions in CRAN politics regarding number of submissions (once in 3-4 month) only major releases will be published there. To get the latest release plase use GitHub sources. You can either download a zip-file with the source package and install it using the install.packages command, e.g. if the downloaded file is mdatools_0.8.0.tar.gz and it is located in a current working directory, just run the following: install.packages(&#39;mdatools_0.8.0.tar.gz&#39;) If you have devtools package installed, the following command will install the latest release from the GitHub (do not forget to load the devtools package first): install_github(&#39;svkucheryavski/mdatools&#39;) -->"],
@@ -14,7 +14,10 @@
 ["models-and-results.html", "Models and results", " Models and results In mdatools, any method for data analysis, such as PCA, PLS regression, SIMCA classification and so on, can create two types of objects — a model and a result. Every time you build a model you get a model object. Every time you apply the model to a dataset you get a result object. Thus for PCA, the objects have classes pca and pcares correspondingly. Each object includes a list with variables (e.g. loadings for model, scores and explained variance for result) and provides a number of methods for investigation. Model calibration Let’s see how this works using a simple example — People data. We used this data when was playing with plots, it consists of 32 objects (persons from Scandinavian and Mediterranean countries, 16 male and 16 female) and 12 variables (height, weight, shoesize, annual income, beer and wine consumption and so on.). More information about the data can be found using ?people. We will first load the data matrix and split it into two subsets as following: library(mdatools) data(people) idx = seq(4, 32, 4) X.c = people[-idx, ] X.t = people[idx, ] So X.c is our calibration subset we are going to use for creating a PCA model and X.t is a subset we will apply the calibrated model to. Now let’s calibrate the model and show an information about the model object: m = pca(X.c, 7, scale = T, info = &quot;People PCA model&quot;) m = selectCompNum(m, 5) Here pca is a function that builds (calibrates) a PCA model and returns the model object. Function selectCompNum allows to select an “optimal” number of components for the model. In our case we calibrate model with 7 principal components (second argument for the function pca()) however, e.g. after investigation of explained variance we found out that 5 components is optimal. In this case we have two choices. 
Either recalibrate the model using 5 components or use the model that is calibrated already but “tell” the model that 5 components is the optimal number. In this case the model will keep all results calculated for 10 components but will use optimal number of components when necessary. For example when showing residuals plot for the model. Or when PCA model is used in SIMCA classification. Finally, function print prints the model object info: print(m) ## ## PCA model (class pca) ## ## ## Call: ## pca(x = X.c, ncomp = 7, scale = T, info = &quot;People PCA model&quot;) ## ## Major fields: ## $loadings - matrix with loadings ## $eigenvals - eigenvalues for components ## $ncomp - number of calculated components ## $ncomp.selected - number of selected components ## $center - values for centering data ## $scale - values for scaling data ## $cv - number of segments for cross-validation ## $alpha - significance level for Q residuals ## $calres - results (scores, etc) for calibration set As you can see there are no scores, explained variance values, residuals and so on. Because they actually are not part of a PCA model, they are results of applying the model to a calibration set. But loadings, eigenvalues, number of calculated and selected principal components, vectors for centering and scaling the data, number of segments for cross-validation (if used) and significance levels are the model fields: m$loadings[1:4, 1:4] ## Comp 1 Comp 2 Comp 3 Comp 4 ## Height -0.3792846 0.08004057 -0.06676611 0.04512380 ## Weight -0.3817929 0.08533809 -0.08527883 -0.04051629 ## Hairleng 0.3513874 -0.22676635 -0.02273504 0.01575716 ## Shoesize -0.3776985 0.12503739 -0.02117369 0.09929010 One can also notice that the model object has a particular field — calres, which is in fact a PCA result object containing results of applying the model to the calibration set. 
If we look at the object description we will get the following: print(m$calres) ## ## Results for PCA decomposition (class pcares) ## ## Major fields: ## $scores - matrix with score values ## $T2 - matrix with T2 distances ## $Q - matrix with Q residuals ## $ncomp.selected - selected number of components ## $expvar - explained variance for each component ## $cumexpvar - cumulative explained variance And if we want to look at scores, here is the way: m$calres$scores[1:4, 1:4] ## Comp 1 Comp 2 Comp 3 Comp 4 ## Lars -5.108742 -1.2714943 1.0765871 1.08910438 ## Peter -3.021811 -0.3163758 -0.2958259 -1.36053121 ## Rasmus -2.887335 -0.4428721 0.1231706 -1.15070563 ## Mette 1.116457 -1.3716444 -1.6344512 -0.03803356 Both model and result objects also have related functions (methods), first of all for visualizing various values (e.g. scores plot, loadings plot, etc.). Some of the functions will be discussed later in this chapter, a full list can be found in help for a proper method. The result object is also created every time you apply a model to a new data. Like in many built-in R methods, method predict() is used in this case. The first argument of the method is always a model object. Here is a PCA example (assuming we have already built the model): res = predict(m, X.t) print(res) ## ## Results for PCA decomposition (class pcares) ## ## Major fields: ## $scores - matrix with score values ## $T2 - matrix with T2 distances ## $Q - matrix with Q residuals ## $ncomp.selected - selected number of components ## $expvar - explained variance for each component ## $cumexpvar - cumulative explained variance Model validation Any model can be validated with cross-validation or/and test set validation. The validation results are, of course, represented by result objects, which are fields of a model object similar to calres, but with names cvres and testres correspondingly. 
Here is how to build a PCA model with full cross-validation and test set validation (we will use X.t as test data) at the same time: m = pca(X.c, 7, scale = T, cv = 1, x.test = X.t, info = &quot;PCA model&quot;) m = selectCompNum(m, 5) Parameter cv specifies options for cross-validation. If a numeric value is provided then it will be used as number of segments for random cross-validation, e.g. if cv = 2 cross-validation with two segments will be used. For full cross-validation use cv = 1 like we did in the example above (this is perhaps a bit misleading, but I keep this option for compatability). For more advanced option you can provide a list with name of cross-validation method, number of segments and number of iterations, e.g. cv = list('rand', 4, 4) for running random cross-validation with four segments and four repetitions. And here is the model object info: print(m) ## ## PCA model (class pca) ## ## ## Call: ## pca(x = X.c, ncomp = 7, scale = T, cv = 1, x.test = X.t, info = &quot;PCA model&quot;) ## ## Major fields: ## $loadings - matrix with loadings ## $eigenvals - eigenvalues for components ## $ncomp - number of calculated components ## $ncomp.selected - number of selected components ## $center - values for centering data ## $scale - values for scaling data ## $cv - number of segments for cross-validation ## $alpha - significance level for Q residuals ## $calres - results (scores, etc) for calibration set ## $cvres - results for cross-validation ## $testres - results for test set As you can see we have all three types of results now — calibration (calres), cross-validation (cvres) and test set validation (testres). 
Let us compare, for example, the explained variance values for the results: var = data.frame(cal = m$calres$expvar, cv = m$cvres$expvar, test = m$testres$expvar) show(round(var, 1)) ## cal cv test ## Comp 1 54.2 43.1 44.8 ## Comp 2 20.3 21.2 17.2 ## Comp 3 13.1 14.7 17.0 ## Comp 4 7.9 13.0 8.0 ## Comp 5 2.3 3.6 4.4 ## Comp 6 1.1 2.0 2.4 ## Comp 7 0.5 0.8 0.7 Every model and every result has a method summary(), which shows some statistics for evaluation of a model performance. Here are some examples. summary(m) ## ## PCA model (class pca) summary ## ## Info: ## PCA model ## ## Eigvals Expvar Cumexpvar ## Comp 1 6.509 54.24 54.24 ## Comp 2 2.434 20.28 74.52 ## Comp 3 1.572 13.10 87.62 ## Comp 4 0.946 7.88 95.51 ## Comp 5 0.272 2.27 97.77 ## Comp 6 0.137 1.14 98.92 ## Comp 7 0.058 0.48 99.39 summary(m$calres) ## ## Summary for PCA results ## ## Selected components: 5 ## ## Expvar Cumexpvar ## Comp 1 54.24 54.24 ## Comp 2 20.28 74.52 ## Comp 3 13.10 87.62 ## Comp 4 7.88 95.51 ## Comp 5 2.27 97.77 ## Comp 6 1.14 98.92 ## Comp 7 0.48 99.39 The same methodology is used for any other method, e.g. PLS or SIMCA. In the next section we will look at how to use plotting functions for models and results. "],
 ["plotting-methods.html", "Plotting methods", " Plotting methods First of all you can use the methods mdaplot() and mdaplotg() (or any others, e.g. ggplot2) for easy visualisation the results as they all available as matrices with proper names, attributes, etc. In the example below we create several scores and loadings plots. Here I assume that the last model you have created was the one with test set and cross-validation. par(mfrow = c(1, 2)) mdaplot(m$calres$scores, type = &#39;p&#39;, show.labels = T, show.lines = c(0, 0)) mdaplot(m$loadings, type = &#39;p&#39;, show.labels = T, show.lines = c(0, 0)) To simplify this routine, every model and result class also has a number of functions for visualization. Thus for PCA the function list includes scores and loadings plots, explained variance and cumulative explained variance plots, T2 vs. Q residuals and many others. A function that does the same for different models and results has always the same name. For example plotPredictions will show predicted vs. measured plot for PLS model and PLS result, MLR model and MLR result, PCR model and PCR result and so on. The first argument must always be either a model or a result object. The major difference between plots for model and plots for result is following. A plot for result always shows one set of data objects — one set of points, lines or bars. For example predicted vs. measured values for calibration set or scores values for test set and so on. For such plots method mdaplot() is used and you can provide any arguments, available for this method (e.g. color group scores for calibration results). And a plot for a model in most cases shows several sets of data objects, e.g. predicted values for calibration and validation. In this case, a corresponding method uses mdaplotg() and therefore you can adjust the plot using arguments described for this method. 
Here are some examples for results: par(mfrow = c(2, 2)) plotScores(m$calres, show.labels = T) plotScores(m$calres, c(1, 3), pch = 18, cgroup = X.c[, &#39;Income&#39;], show.labels = T, labels = &#39;indices&#39;) plotResiduals(m$calres, show.labels = T, cgroup = X.c[, &#39;Weight&#39;]) plotVariance(m$calres, type = &#39;h&#39;, show.labels = T, labels = &#39;values&#39;) The color grouping option is not available for the group (model) plots as colors are used there to underline the groups. Now let’s look at similar plots (plus loadings) for a model. par(mfrow = c(2, 2)) plotScores(m, c(1, 3), show.labels = T) plotLoadings(m, c(1, 3), show.labels = T) plotResiduals(m, col = c(&#39;red&#39;, &#39;green&#39;, &#39;blue&#39;)) plotVariance(m, type = &#39;h&#39;, show.labels = T, labels = &#39;values&#39;) Method plot() shows the main four PCA plots as a model (or results) overview. plot(m, show.labels = T) You do not have to care about labels, names, legend and so on, however if necessary you can always change almost anything. See full list of methods available for PCA by ?pca and ?pcares. Support for images As it was described before, images can be used as a source of data for any methods. In this case the results, related to objects/pixels will inherit all necessary attributes and can be show as images as well. In the example below we make a PCA model for the image data from the package and show scores and residuals. data(pellets) X = mda.im2data(pellets) m = pca(X) par(mfrow = c(2, 2)) imshow(m$calres$scores) imshow(m$calres$Q) imshow(m$calres$scores, 2) imshow(m$calres$Q, 2) Manual x-values for loading line plot As it was discussed in the previous chapter, you can specify a special attribute, 'xaxis.values' to a dataset, which will be used as manual x-values in bar and line plots. When we create any model and/or results the most important attributes, including this one, are inherited. 
For example when you make a loading line plot it will be shown using the attribute values. data(simdata) X = simdata$spectra.c attr(X, &#39;xaxis.name&#39;) = &#39;Wavelength, nm&#39; attr(X, &#39;xaxis.values&#39;) = simdata$wavelength m = pca(X, 3) plotLoadings(m, 1:3, type = &#39;l&#39;) Excluding rows and columns From v. 0.8.0 PCA implementation as well as any other method in mdatools can exclude rows and columns from calculations. For example it can be useful if you have some candidates for outliers or do variable selection and do not want to remove rows and columns physically from the data matrix. In this case you can just specify two additional parameters, exclcols and exclrows, using either numbers or names of rows/columns to be excluded. You can also specify a vector with logical values (all TRUEs will be excluded). The excluded rows are not used for creating a model and calculaiton of model’s and results’ performance (e.g. explained variance). However main results (for PCA — scores and residuals) are calculated for these rows as well and set hidden, so you will not see them on plots. You can always e.g. show scores for excluded objects by using show.excluded = TRUE. It is implemented via attributes “known” for plotting methods from mdatools so if you use e.g. ggplot2 you will see all points. The excluded columns are not used for any calculations either, the corresponding results (e.g. loadings or regression coefficients) will have zero values for such columns and be also hidden on plots. Here is a simple example. 
data(people) m = pca(people, 5, scale = T, exclrows = c(&#39;Lars&#39;, &#39;Federico&#39;), exclcols = &#39;Income&#39;) par(mfrow = c(2, 2)) plotScores(m, show.labels = T) plotScores(m, show.excluded = T, show.labels = T) plotResiduals(m, show.excluded = T, show.labels = T) plotLoadings(m, show.excluded = T, show.labels = T) # show matrix with loadings (look at row Income and attribute &quot;exclrows&quot;) show(m$loadings) ## Comp 1 Comp 2 Comp 3 Comp 4 Comp 5 ## Height -0.386393327 0.10697019 -0.004829174 0.12693029 -0.13128331 ## Weight -0.391013398 0.07820097 0.051916032 0.04049593 -0.14757465 ## Hairleng 0.350435073 -0.11623295 -0.103852349 -0.04969503 -0.73669997 ## Shoesize -0.385424793 0.13805817 -0.069172117 0.01049098 -0.17075488 ## Age -0.103466285 0.18964288 -0.337243182 -0.89254403 -0.02998028 ## Income 0.000000000 0.00000000 0.000000000 0.00000000 0.00000000 ## Beer -0.317356319 -0.38259695 0.044338872 -0.03908064 -0.21419831 ## Wine 0.140711271 0.57861817 -0.059833970 0.12347379 -0.41488773 ## Sex 0.364537185 -0.23838610 0.010818891 0.04025631 -0.18263577 ## Swim -0.377470722 0.04330411 0.008151288 0.18149268 -0.30163601 ## Region 0.140581701 0.60435183 0.040969200 0.15147464 0.17857614 ## IQ 0.009849911 0.09372132 0.927669306 -0.32978247 -0.11815762 ## attr(,&quot;exclrows&quot;) ## [1] 6 ## attr(,&quot;name&quot;) ## [1] &quot;Loadings&quot; ## attr(,&quot;xaxis.name&quot;) ## [1] &quot;Components&quot; Such behavior will help to exclude and include rows and columns interactively, when GUI add-in for mdatools() is available. -->"],
 ["partial-least-squares-regression.html", "Partial least squares regression", " Partial least squares regression Partial least squares regression is a linear regression method, which uses principles similar to PCA: data is decomposed using latent variables. Because in this case we have two datasets, predictors (\\(X\\)) and responses (\\(Y\\)) we do decomposition for both, computing scores, loadings and residuals: \\(X = TP^T + E_x\\), \\(Y = UQ^T + E_y\\). In addition to that, orientation of latent variables in PLS is selected to maximize the covariance between the X-scores, \\(T\\), and Y-scores \\(U\\). This approach makes possible to work with datasets where more traditional Multiple Linear Regression fails — when number of variables exceeds number of observations and when X-variables are mutually correlated. But at the end PLS-model is a linear model, where response value is a linear combination of predictors, so the main outcome is a vector with regression coefficients. There are two main algorithms for PLS, NIPALS and SIMPLS, in the mdatools only the last one is implemented. PLS model and PLS results objects have a lot of components and performance statistics, which can be visualised via plots. Besides that the implemented pls() method calculates selectivity ratio and VIP scores, which can be used for selection of most important variables. We will discuss most of the methods in this chapter and you can get the full list using ?pls. "],
-["models-and-results-1.html", "Models and results", " Models and results Like we discussed in PCA, matools creates two types of objects — a model and a result. Every time you build a PLS model you get a model object. Every time you apply the model to a dataset you get a result object. For PLS, the objects have classes pls and plsres correspondingly. Model calibration Let’s use the same People data and create a PLS-model for prediction of Shoesize (column number four) using other 11 variables as predictors. As usual, we start with preparing datasets (we will also split the data into calibration and test subsets): library(mdatools) data(people) idx = seq(4, 32, 4) X.c = people[-idx, -4] y.c = people[-idx, 4, drop = F] X.t = people[idx, -4] y.t = people[idx, 4, drop = F] So X.c and y.c are predictors and response values for calibration subset. Now let’s calibrate the model and show an information about the model object: m = pls(X.c, y.c, 7, scale = T, info = &quot;Shoesize prediction model&quot;) ## Warning in selectCompNum.pls(model): No validation results were found! m = selectCompNum(m, 3) As you can see, the procedure is very similar to PCA, here we use 7 latent variables and select 3 first as an optimal number. Here is an info for the model object: print(m) ## ## PLS model (class pls) ## ## Call: ## pls.cal(x = x, y = y, ncomp = ncomp, center = center, scale = scale, ## method = method, cv = cv, alpha = alpha, coeffs.ci = coeffs.ci, ## coeffs.alpha = coeffs.alpha, info = info, light = light, ## exclcols = exclcols, exclrows = exclrows, ncomp.selcrit = ncomp.selcrit) ## ## Major fields: ## $ncomp - number of calculated components ## $ncomp.selected - number of selected components ## $coeffs - object (regcoeffs) with regression coefficients ## $xloadings - vector with x loadings ## $yloadings - vector with y loadings ## $weights - vector with weights ## $calres - results for calibration set ## ## Try summary(model) and plot(model) to see the model performance. 
As expected, we see loadings for predictors and responses, matrix with weights, and a special object (regcoeffs) for regression coefficients. The values for regression coefficients are available in m.regcoeffs.values, it is an array with dimension nVariables x nComponents x nPredictors. The reason to use the object instead of just an array is mainly for being able to get and plot regression coefficients for different methods. Besides that, it is possible to calculate confidence intervals and other statistics for the coefficients using Jack-Knife method (will be shown later), which produces extra entities. The regression coefficients can be shown as plot using either function plotRegcoeffs() for the PLS model object or function plot() for the object with regression coefficients. You need to specify for which predictor (if you have more than one y-variable) and which number of components you want to see the coefficients for. By default it shows values for the optimal number of components and first y-variable as it is shown on example below. par(mfrow = c(2, 2)) plotRegcoeffs(m) plotRegcoeffs(m, ncomp = 2) plot(m$coeffs, ncomp = 3, type = &#39;h&#39;, show.labels = T) plot(m$coeffs, ncomp = 2) The model keeps regression coefficients, calculated for centered and standardized data, without intercept, etc. Here are the values for three PLS components. 
show(m$coeffs$values[, 3, 1]) ## Height Weight Hairleng Age Income ## 0.210411676 0.197646483 -0.138824482 0.026613035 -0.000590693 ## Beer Wine Sex Swim Region ## 0.148917913 0.138138095 -0.138824482 0.223962000 0.010392542 ## IQ ## -0.088658626 You can get the corrected coefficients, which can be applied directly to the raw data, by using method getRegcoeffs(): show(getRegcoeffs(m, ncomp = 3)) ## Shoesize ## Intercept 1.251537e+01 ## Height 8.105287e-02 ## Weight 5.110732e-02 ## Hairleng -5.375404e-01 ## Age 1.147785e-02 ## Income -2.580586e-07 ## Beer 6.521476e-03 ## Wine 1.253340e-02 ## Sex -5.375404e-01 ## Swim 1.164947e-01 ## Region 4.024083e-02 ## IQ -2.742712e-02 Similar to PCA, model object may contain three fields for results obtained using calibration set (calres), cross-validation (cvres) and test set validation (testres). All three have class plsres, here is how calres looks like: print(m$calres) ## ## PLS results (class plsres) ## ## Call: ## plsres(y.pred = yp, y.ref = y.ref, ncomp.selected = object$ncomp.selected, ## xdecomp = xdecomp, ydecomp = ydecomp) ## ## Major fields: ## $ncomp.selected - number of selected components ## $yp - array with predicted y values ## $y - matrix with reference y values ## $rmse - root mean squared error ## $r2 - coefficient of determination ## $slope - slope for predicted vs. measured values ## $bias - bias for prediction vs. measured values ## $ydecomp - decomposition of y values (ldecomp object) ## $xdecomp - decomposition of x values (ldecomp object) The xdecomp and ydecomp are objects similar to pcares, they contain scores, residuals and variances for decomposition of X and Y correspondingly. 
print(m$calres$xdecomp) ## ## Results of data decomposition (class ldecomp) ## ## Major fields: ## $scores - matrix with score values ## $T2 - matrix with T2 distances ## $Q - matrix with Q residuals ## $ncomp.selected - selected number of components ## $expvar - explained variance for each component ## $cumexpvar - cumulative explained variance Other fields are mostly various performance statistics, including slope, coefficient of determination (R2), bias, and root mean squared error (RMSE). Besides that, the results also include reference y-values and array with predicted y-values. The array has dimension nObjects x nComponents x nResponses. PLS predictions for a new set can be obtained using method predict: res = predict(m, X.t, y.t) print(res) ## ## PLS results (class plsres) ## ## Call: ## plsres(y.pred = yp, y.ref = y.ref, ncomp.selected = object$ncomp.selected, ## xdecomp = xdecomp, ydecomp = ydecomp) ## ## Major fields: ## $ncomp.selected - number of selected components ## $yp - array with predicted y values ## $y - matrix with reference y values ## $rmse - root mean squared error ## $r2 - coefficient of determination ## $slope - slope for predicted vs. measured values ## $bias - bias for prediction vs. measured values ## $ydecomp - decomposition of y values (ldecomp object) ## $xdecomp - decomposition of x values (ldecomp object) Model validation Validation is implemented similar to PCA, the only difference is that you need to provide two datasets for a test set — one for predictors (x.test) and one for response (y.test) values. Cross-validation is very important for PLS as it helps to find optimal number of PLS components (so test set performance is more fair as in this case you do not use test set for optimization). Therefore, it is always recommended to use cross-validation. 
You probably have noticed a small warning we got when created the first PLS model in this chapter: m = pls(X.c, y.c, 7, scale = T, info = &quot;Shoesize prediction model&quot;) ## Warning in selectCompNum.pls(model): No validation results were found! When you create a model, it tries to select optimal number of components automatically (which, of course, you can always change later). To do that, the method uses RMSE values, calculated for different number of components and cross-validation predictions. So, if we do not use cross-validation, it warns use about this. There are two different ways/criteria for automatic selection. One is using first local minimum on the RMSE plot and second is so called Wold criterion, based on a ratio between PRESS values for current and next component. You can select which criterion to use by specifying parameter ncomp.selcrit (either 'min' or 'wold') as it is shown below. m1 = pls(X.c, y.c, 7, scale = T, cv = 1, ncomp.selcrit = &#39;min&#39;) show(m1$ncomp.selected) ## [1] 5 m2 = pls(X.c, y.c, 7, scale = T, cv = 1, ncomp.selcrit = &#39;wold&#39;) show(m2$ncomp.selected) ## [1] 4 And here is the RMSE plots (they are identical of course): par(mfrow = c(1, 2)) plotRMSE(m1) plotRMSE(m2) Parameter cv has the same format as for PCA. If it is a number, it will be used as number of segments for random cross-validation, e.g. if cv = 2 cross-validation with two segments will be carried out. For full cross-validation use cv = 1 like we did in the example above. For more advanced option you can provide a list with name of cross-validation method, number of segments and number of iterations, e.g. cv = list('rand', 4, 4) for running random cross-validation with four segments and four repetitions or cv = list('ven', 8) for systematic split into eight segments (venetian blinds). Method summary() for model shows performance statistics calculated using optimal number of components for each of the results. 
summary(m1) ## ## PLS model (class pls) summary ## ## Performance and validation: ## Number of selected components: 5 ## X cumexpvar Y cumexpvar RMSE Slope Bias RPD ## Cal 97.64 98.19 0.521 0.98 0e+00 7.59 ## CV 92.90 96.22 0.753 0.98 -2e-04 5.26 If you want more details run summury() for one of the result objects. summary(m1$calres) ## ## PLS regression results (class plsres) summary ## ## Response variable Shoesize: ## X expvar X cumexpvar Y expvar Y cumexpvar RMSE Slope Bias RPD ## Comp 1 50.505 50.505 93.779 93.779 0.966 0.938 0 4.1 ## Comp 2 20.979 71.484 2.926 96.705 0.703 0.967 0 5.6 ## Comp 3 8.667 80.151 0.917 97.622 0.597 0.976 0 6.6 ## Comp 4 5.847 85.998 0.479 98.101 0.534 0.981 0 7.4 ## Comp 5 11.642 97.640 0.088 98.189 0.521 0.982 0 7.6 ## Comp 6 0.495 98.135 0.347 98.536 0.468 0.985 0 8.4 ## Comp 7 0.442 98.577 0.202 98.738 0.435 0.987 0 9.1 There is no column for R2 as Y cumexpvar values are the same. "],
+["models-and-results-1.html", "Models and results", " Models and results Like we discussed in PCA, mdatools creates two types of objects — a model and a result. Every time you build a PLS model you get a model object. Every time you apply the model to a dataset you get a result object. For PLS, the objects have classes pls and plsres correspondingly. Model calibration Let’s use the same People data and create a PLS-model for prediction of Shoesize (column number four) using other 11 variables as predictors. As usual, we start with preparing datasets (we will also split the data into calibration and test subsets): library(mdatools) data(people) idx = seq(4, 32, 4) X.c = people[-idx, -4] y.c = people[-idx, 4, drop = F] X.t = people[idx, -4] y.t = people[idx, 4, drop = F] So X.c and y.c are predictors and response values for calibration subset. Now let’s calibrate the model and show information about the model object: m = pls(X.c, y.c, 7, scale = T, info = &quot;Shoesize prediction model&quot;) ## Warning in selectCompNum.pls(model): No validation results were found! m = selectCompNum(m, 3) As you can see, the procedure is very similar to PCA, here we use 7 latent variables and select 3 first as an optimal number. Here is an info for the model object: print(m) ## ## PLS model (class pls) ## ## Call: ## pls.cal(x = x, y = y, ncomp = ncomp, center = center, scale = scale, ## method = method, cv = cv, alpha = alpha, coeffs.ci = coeffs.ci, ## coeffs.alpha = coeffs.alpha, info = info, light = light, ## exclcols = exclcols, exclrows = exclrows, ncomp.selcrit = ncomp.selcrit) ## ## Major fields: ## $ncomp - number of calculated components ## $ncomp.selected - number of selected components ## $coeffs - object (regcoeffs) with regression coefficients ## $xloadings - vector with x loadings ## $yloadings - vector with y loadings ## $weights - vector with weights ## $calres - results for calibration set ## ## Try summary(model) and plot(model) to see the model performance. 
As expected, we see loadings for predictors and responses, matrix with weights, and a special object (regcoeffs) for regression coefficients. The values for regression coefficients are available in m$coeffs$values, it is an array with dimension nVariables x nComponents x nResponses. The reason to use the object instead of just an array is mainly for being able to get and plot regression coefficients for different methods. Besides that, it is possible to calculate confidence intervals and other statistics for the coefficients using Jack-Knife method (will be shown later), which produces extra entities. The regression coefficients can be shown as a plot using either function plotRegcoeffs() for the PLS model object or function plot() for the object with regression coefficients. You need to specify for which response (if you have more than one y-variable) and which number of components you want to see the coefficients for. By default it shows values for the optimal number of components and first y-variable as it is shown in the example below. par(mfrow = c(2, 2)) plotRegcoeffs(m) plotRegcoeffs(m, ncomp = 2) plot(m$coeffs, ncomp = 3, type = &#39;h&#39;, show.labels = T) plot(m$coeffs, ncomp = 2) The model keeps regression coefficients, calculated for centered and standardized data, without intercept, etc. Here are the values for three PLS components. 
show(m$coeffs$values[, 3, 1]) ## Height Weight Hairleng Age Income ## 0.210411676 0.197646483 -0.138824482 0.026613035 -0.000590693 ## Beer Wine Sex Swim Region ## 0.148917913 0.138138095 -0.138824482 0.223962000 0.010392542 ## IQ ## -0.088658626 You can get the corrected coefficients, which can be applied directly to the raw data, by using method getRegcoeffs(): show(getRegcoeffs(m, ncomp = 3)) ## Shoesize ## Intercept 1.251537e+01 ## Height 8.105287e-02 ## Weight 5.110732e-02 ## Hairleng -5.375404e-01 ## Age 1.147785e-02 ## Income -2.580586e-07 ## Beer 6.521476e-03 ## Wine 1.253340e-02 ## Sex -5.375404e-01 ## Swim 1.164947e-01 ## Region 4.024083e-02 ## IQ -2.742712e-02 Similar to PCA, model object may contain three fields for results obtained using calibration set (calres), cross-validation (cvres) and test set validation (testres). All three have class plsres, here is how calres looks like: print(m$calres) ## ## PLS results (class plsres) ## ## Call: ## plsres(y.pred = yp, y.ref = y.ref, ncomp.selected = object$ncomp.selected, ## xdecomp = xdecomp, ydecomp = ydecomp) ## ## Major fields: ## $ncomp.selected - number of selected components ## $yp - array with predicted y values ## $y - matrix with reference y values ## $rmse - root mean squared error ## $r2 - coefficient of determination ## $slope - slope for predicted vs. measured values ## $bias - bias for prediction vs. measured values ## $ydecomp - decomposition of y values (ldecomp object) ## $xdecomp - decomposition of x values (ldecomp object) The xdecomp and ydecomp are objects similar to pcares, they contain scores, residuals and variances for decomposition of X and Y correspondingly. 
print(m$calres$xdecomp) ## ## Results of data decomposition (class ldecomp) ## ## Major fields: ## $scores - matrix with score values ## $T2 - matrix with T2 distances ## $Q - matrix with Q residuals ## $ncomp.selected - selected number of components ## $expvar - explained variance for each component ## $cumexpvar - cumulative explained variance Other fields are mostly various performance statistics, including slope, coefficient of determination (R2), bias, and root mean squared error (RMSE). Besides that, the results also include reference y-values and array with predicted y-values. The array has dimension nObjects x nComponents x nResponses. PLS predictions for a new set can be obtained using method predict: res = predict(m, X.t, y.t) print(res) ## ## PLS results (class plsres) ## ## Call: ## plsres(y.pred = yp, y.ref = y.ref, ncomp.selected = object$ncomp.selected, ## xdecomp = xdecomp, ydecomp = ydecomp) ## ## Major fields: ## $ncomp.selected - number of selected components ## $yp - array with predicted y values ## $y - matrix with reference y values ## $rmse - root mean squared error ## $r2 - coefficient of determination ## $slope - slope for predicted vs. measured values ## $bias - bias for prediction vs. measured values ## $ydecomp - decomposition of y values (ldecomp object) ## $xdecomp - decomposition of x values (ldecomp object) Model validation Validation is implemented similar to PCA, the only difference is that you need to provide two datasets for a test set — one for predictors (x.test) and one for response (y.test) values. Cross-validation is very important for PLS as it helps to find optimal number of PLS components (so test set performance is more fair as in this case you do not use test set for optimization). Therefore, it is always recommended to use cross-validation. 
You probably have noticed a small warning we got when created the first PLS model in this chapter: m = pls(X.c, y.c, 7, scale = T, info = &quot;Shoesize prediction model&quot;) ## Warning in selectCompNum.pls(model): No validation results were found! When you create a model, it tries to select optimal number of components automatically (which, of course, you can always change later). To do that, the method uses RMSE values, calculated for different number of components and cross-validation predictions. So, if we do not use cross-validation, it warns use about this. There are two different ways/criteria for automatic selection. One is using first local minimum on the RMSE plot and second is so called Wold criterion, based on a ratio between PRESS values for current and next component. You can select which criterion to use by specifying parameter ncomp.selcrit (either 'min' or 'wold') as it is shown below. m1 = pls(X.c, y.c, 7, scale = T, cv = 1, ncomp.selcrit = &#39;min&#39;) show(m1$ncomp.selected) ## [1] 5 m2 = pls(X.c, y.c, 7, scale = T, cv = 1, ncomp.selcrit = &#39;wold&#39;) show(m2$ncomp.selected) ## [1] 4 And here are the RMSE plots (they are identical of course): par(mfrow = c(1, 2)) plotRMSE(m1) plotRMSE(m2) Parameter cv has the same format as for PCA. If it is a number, it will be used as number of segments for random cross-validation, e.g. if cv = 2 cross-validation with two segments will be carried out. For full cross-validation use cv = 1 like we did in the example above. For more advanced option you can provide a list with name of cross-validation method, number of segments and number of iterations, e.g. cv = list('rand', 4, 4) for running random cross-validation with four segments and four repetitions or cv = list('ven', 8) for systematic split into eight segments (venetian blinds). Method summary() for model shows performance statistics calculated using optimal number of components for each of the results. 
summary(m1) ## ## PLS model (class pls) summary ## ## Performance and validation: ## Number of selected components: 5 ## X cumexpvar Y cumexpvar RMSE Slope Bias RPD ## Cal 97.64 98.19 0.521 0.98 0e+00 7.59 ## CV 92.90 96.22 0.753 0.98 -2e-04 5.26 If you want more details run summary() for one of the result objects. summary(m1$calres) ## ## PLS regression results (class plsres) summary ## ## Response variable Shoesize: ## X expvar X cumexpvar Y expvar Y cumexpvar RMSE Slope Bias RPD ## Comp 1 50.505 50.505 93.779 93.779 0.966 0.938 0 4.1 ## Comp 2 20.979 71.484 2.926 96.705 0.703 0.967 0 5.6 ## Comp 3 8.667 80.151 0.917 97.622 0.597 0.976 0 6.6 ## Comp 4 5.847 85.998 0.479 98.101 0.534 0.981 0 7.4 ## Comp 5 11.642 97.640 0.088 98.189 0.521 0.982 0 7.6 ## Comp 6 0.495 98.135 0.347 98.536 0.468 0.985 0 8.4 ## Comp 7 0.442 98.577 0.202 98.738 0.435 0.987 0 9.1 There is no column for R2 as Y cumexpvar values are the same. "],
 ["plotting-methods-1.html", "Plotting methods", " Plotting methods Plotting methods, again, work similar to PCA, so in this section we will look more detailed on the available methods instead of on how to customize them. PLS has a lot of different results and much more possible plots. Here is a list of methods, which will work both for a model and for a particular results. Methods for summary statistics. Methods Description plotRMSE(obj, ny = 1, ...) RMSE values vs. number of components in a model plotXVariance(obj) explained variance for X decomposition for each component plotXCumVariance(obj) same as above but cumulative plotYVariance(obj) explained variance for Y decomposition for each component plotYCumVariance(obj) same as above but cumulative Here and in some other methods parameter ny is used to specify which y-variable you want to see a plot for (if y is multivariate). Methods for objects. Methods Description plotPredictions(obj, ny = 1, ncomp) Plot with predicted vs. measured (reference) y-values plotXScores(obj, comp) Scores for decompositon of X (similar to PCA scores plot) plotYScores(obj, comp) Scores for decompositon of y (similar to PCA scores plot) plotXResiduals(obj, ncomp) Residuals for decompositon of X (similar to PCA residuals plot) plotYResiduals(obj, ncomp) Residuals for y vs. real (reference) y-values plotXScores(obj, ncomp) Y-scores vs. X-scores for a particular PLS component. Parameter comp allows to provide a number of selected components (one or several) to show the plot for, while parameter ncomp assume that only one number is expected (number of components in a model or individual component). So if e.g. you created model for five components and selected three, you can also see, for example, prediction plot if you use only one or four components. 
Here is an example for m1 model: par(mfrow = c(1, 2)) plotPredictions(m1) plotPredictions(m1, ncomp = 1) The plots for variables are available only for a model object and include: Methods Description plotXLoadings(obj, comp) Loadings for decompositon of X (similar to PCA loadings plot) plotYLoadings(obj, comp) Loadings for decompositon of y (similar to PCA loadings plot) plotWeights(obj, comp) Weights (W) for PLS decomposition plotRegcoeffs(obj, ny, ncomp) Plot with regression coefficients plotVIPScores(obj, ny) VIP scores for the predictors plotSelectivityRation(obj, ny, ncomp) Selectivity ratio of the predictors And, of course, both model and result objects have method plot() for giving an overview. plot(m1) Excluding rows and columns From v. 0.8.0 PCA implementation as well as any other method in mdatools can exclude rows and columns from calculations. The implementation works similar to what was described for PCA. For example it can be useful if you have some candidates for outliers or do variable selection and do not want to remove rows and columns physically from the data matrix. In this case you can just specify two additional parameters, exclcols and exclrows, using either numbers or names of rows/columns to be excluded. You can also specify a vector with logical values (all TRUEs will be excluded). The excluded rows are not used for creating a model and calculation of model’s and results’ performance (e.g. explained variance). However main results (for PLS — scores, predictions, residuals) are calculated for these rows as well and set hidden, so you will not see them on plots. You can always e.g. show scores for excluded objects by using show.excluded = TRUE. It is implemented via attributes “known” for plotting methods from mdatools so if you use e.g. ggplot2 you will see all points. The excluded columns are not used for any calculations either, the corresponding results (e.g. 
loadings, weights or regression coefficients) will have zero values for such columns and be also hidden on plots. "],
-["variable-selection.html", "Variable selection", " Variable selection PLS calculates several statistics, which can be used to select most important (or remove least important) variables in order to improve performance and make model simpler. The first two are VIP-scores (variables important for projection) and Selectivity ratio. All details and theory can be found e.g. here. Both parameters can be shown as plots and as vector of values for a selected y-variable. Selectivity ration is calculated for all possible components in a model, but VIP scores (due to computational time) only for selected number of components and are recalculated every time you change number of optimal components using selectCompNum() method. Here are some plots. par(mfrow = c(2, 2)) plotVIPScores(m1, type = &#39;h&#39;, show.labels = T) plotSelectivityRatio(m1, type = &#39;b&#39;, show.labels = T) plotSelectivityRatio(m1, ncomp = 1, type = &#39;h&#39;, show.labels = T) plotSelectivityRatio(m1, ncomp = 2, type = &#39;h&#39;, show.labels = T) In the example below, I create two other PLS models by excluding variables with VIP score or selectivity ratio below a threshold (I use 0.5 and 1 correspondingly) and show the performance for both. 
m3 = pls(X.c, y.c, 5, scale = T, cv = 1, exclcols = getVIPScores(m1, ncomp = 2) &lt; 0.5) summary(m3) ## ## PLS model (class pls) summary ## ## Performance and validation: ## Number of selected components: 4 ## X cumexpvar Y cumexpvar RMSE Slope Bias RPD ## Cal 85.29 98.15 0.527 0.98 0.0000 7.50 ## CV 80.53 96.34 0.741 0.97 -0.0382 5.34 m4 = pls(X.c, y.c, 5, scale = T, cv = 1, exclcols = getSelectivityRatio(m1, ncomp = 2) &lt; 1) summary(m4) ## ## PLS model (class pls) summary ## ## Performance and validation: ## Number of selected components: 1 ## X cumexpvar Y cumexpvar RMSE Slope Bias RPD ## Cal 86.80 94.97 0.868 0.95 0.0000 4.56 ## CV 84.37 93.91 0.955 0.94 0.0034 4.14 Another way is make an inference about regression coefficients and calculate confidence intervals and p-values for each variable. This can be done usine Jack-Knife approach, when model is cross-validated using efficient number of segments (at least ten) and statistics are calculated using the distribution of regression coefficient values obtained for each step. There are two parameters, coeffs.ci and coeffs.alpha, first is to select the method (so far only Jack-Knife is available, the value is 'jk') and second is a level of significance for computing confidence intervals (by default is 0.1). Here is an example. mjk = pls(X.c, y.c, 7, scale = T, coeffs.ci = &#39;jk&#39;, coeffs.alpha = 0.05) If number of segments is not specified as in the example above, full cross-validation will be used. The statistics are calculated for each y-variable and each available number of components. When you show a plot for regression coefficients, confidence interval will be shown automatically. You can changes this by using parameter show.ci = FALS. 
par(mfrow = c(2, 2)) plotRegcoeffs(mjk, type = &#39;h&#39;, show.labels = T) plotRegcoeffs(mjk, ncomp = 2, type = &#39;h&#39;, show.labels = T) plotRegcoeffs(mjk, type = &#39;h&#39;, show.labels = T, show.ci = F) plotRegcoeffs(mjk, ncomp = 2, type = &#39;h&#39;, show.labels = T, show.ci = F) Function getRegcoeffs() in this case may also return a column with p-values, if user specifies a parameter full. show(getRegcoeffs(mjk, ncomp = 2, full = T)) ## Shoesize p-value ## Intercept 1.342626e+01 NA ## Height 7.456695e-02 2.116375e-18 ## Weight 4.896328e-02 5.012592e-18 ## Hairleng -6.865495e-01 1.137354e-14 ## Age 1.081716e-02 3.579832e-01 ## Income 5.642220e-06 7.032445e-01 ## Beer 5.010542e-03 2.136646e-06 ## Wine 7.511377e-03 1.204856e-02 ## Sex -6.865495e-01 1.137354e-14 ## Swim 1.010496e-01 3.941369e-13 ## Region 1.035071e-01 2.708059e-01 ## IQ -5.277164e-03 6.033516e-01 The p-values are stored as a 3-way array similar to regression coefficients. The selection can be made by comparing e.g. p-values with a threshold similar to what we have done with VIP-scores and selectivity ratio. exclcols = mjk$coeffs$p.values[, 2, 1] &gt; 0.05 show(exclcols) ## Height Weight Hairleng Age Income Beer Wine Sex ## FALSE FALSE FALSE TRUE TRUE FALSE FALSE FALSE ## Swim Region IQ ## FALSE TRUE TRUE Here p.values[, 2, 1] means values for all predictors, model with two components, first y-variable. 
newm = pls(X.c, y.c, 3, scale = T, cv = 1, exclcols = exclcols) summary(newm) ## ## PLS model (class pls) summary ## ## Performance and validation: ## Number of selected components: 3 ## X cumexpvar Y cumexpvar RMSE Slope Bias RPD ## Cal 97.85 97.79 0.575 0.98 0.0000 6.87 ## CV 96.64 96.49 0.727 0.97 -0.0161 5.44 show(getRegcoeffs(newm)) ## Shoesize ## Intercept 4.952691046 ## Height 0.091079963 ## Weight 0.052708955 ## Hairleng -0.315927643 ## Age 0.000000000 ## Income 0.000000000 ## Beer 0.009320427 ## Wine 0.018524717 ## Sex -0.315927643 ## Swim 0.134354170 ## Region 0.000000000 ## IQ 0.000000000 As you can see, the variables Age, Income, Region and IQ have been excluded as they are not related to the Shoesize, which seems to be correct. Variable selection as well as all described above can be also carried out for PLS discriminant analysis (PLS-DA), which can be explained later in one of the next chapters. -->"]
+["variable-selection.html", "Variable selection", " Variable selection PLS calculates several statistics, which can be used to select most important (or remove least important) variables in order to improve performance and make model simpler. The first two are VIP-scores (variable importance in projection) and Selectivity ratio. All details and theory can be found e.g. here. Both parameters can be shown as plots and as vector of values for a selected y-variable. Selectivity ratio is calculated for all possible components in a model, but VIP scores (due to computational time) only for selected number of components and are recalculated every time you change number of optimal components using selectCompNum() method. Here are some plots. par(mfrow = c(2, 2)) plotVIPScores(m1, type = &#39;h&#39;, show.labels = T) plotSelectivityRatio(m1, type = &#39;b&#39;, show.labels = T) plotSelectivityRatio(m1, ncomp = 1, type = &#39;h&#39;, show.labels = T) plotSelectivityRatio(m1, ncomp = 2, type = &#39;h&#39;, show.labels = T) In the example below, I create two other PLS models by excluding variables with VIP score or selectivity ratio below a threshold (I use 0.5 and 1 correspondingly) and show the performance for both. 
m3 = pls(X.c, y.c, 5, scale = T, cv = 1, exclcols = getVIPScores(m1, ncomp = 2) &lt; 0.5) summary(m3) ## ## PLS model (class pls) summary ## ## Performance and validation: ## Number of selected components: 4 ## X cumexpvar Y cumexpvar RMSE Slope Bias RPD ## Cal 85.29 98.15 0.527 0.98 0.0000 7.50 ## CV 80.53 96.34 0.741 0.97 -0.0382 5.34 m4 = pls(X.c, y.c, 5, scale = T, cv = 1, exclcols = getSelectivityRatio(m1, ncomp = 2) &lt; 1) summary(m4) ## ## PLS model (class pls) summary ## ## Performance and validation: ## Number of selected components: 1 ## X cumexpvar Y cumexpvar RMSE Slope Bias RPD ## Cal 86.80 94.97 0.868 0.95 0.0000 4.56 ## CV 84.37 93.91 0.955 0.94 0.0034 4.14 Another way is to make an inference about regression coefficients and calculate confidence intervals and p-values for each variable. This can be done using the Jack-Knife approach, when model is cross-validated using a sufficient number of segments (at least ten) and statistics are calculated using the distribution of regression coefficient values obtained for each step. There are two parameters, coeffs.ci and coeffs.alpha, first is to select the method (so far only Jack-Knife is available, the value is 'jk') and second is a level of significance for computing confidence intervals (by default is 0.1). Here is an example. mjk = pls(X.c, y.c, 7, scale = T, coeffs.ci = &#39;jk&#39;, coeffs.alpha = 0.05) If number of segments is not specified as in the example above, full cross-validation will be used. The statistics are calculated for each y-variable and each available number of components. When you show a plot for regression coefficients, confidence interval will be shown automatically. You can change this by using parameter show.ci = FALSE. 
par(mfrow = c(2, 2)) plotRegcoeffs(mjk, type = &#39;h&#39;, show.labels = T) plotRegcoeffs(mjk, ncomp = 2, type = &#39;h&#39;, show.labels = T) plotRegcoeffs(mjk, type = &#39;h&#39;, show.labels = T, show.ci = F) plotRegcoeffs(mjk, ncomp = 2, type = &#39;h&#39;, show.labels = T, show.ci = F) Function getRegcoeffs() in this case may also return a column with p-values, if user specifies a parameter full. show(getRegcoeffs(mjk, ncomp = 2, full = T)) ## Shoesize p-value ## Intercept 1.342626e+01 NA ## Height 7.456695e-02 2.116375e-18 ## Weight 4.896328e-02 5.012592e-18 ## Hairleng -6.865495e-01 1.137354e-14 ## Age 1.081716e-02 3.579832e-01 ## Income 5.642220e-06 7.032445e-01 ## Beer 5.010542e-03 2.136646e-06 ## Wine 7.511377e-03 1.204856e-02 ## Sex -6.865495e-01 1.137354e-14 ## Swim 1.010496e-01 3.941369e-13 ## Region 1.035071e-01 2.708059e-01 ## IQ -5.277164e-03 6.033516e-01 The p-values are stored as a 3-way array similar to regression coefficients. The selection can be made by comparing e.g. p-values with a threshold similar to what we have done with VIP-scores and selectivity ratio. exclcols = mjk$coeffs$p.values[, 2, 1] &gt; 0.05 show(exclcols) ## Height Weight Hairleng Age Income Beer Wine Sex ## FALSE FALSE FALSE TRUE TRUE FALSE FALSE FALSE ## Swim Region IQ ## FALSE TRUE TRUE Here p.values[, 2, 1] means values for all predictors, model with two components, first y-variable. 
newm = pls(X.c, y.c, 3, scale = T, cv = 1, exclcols = exclcols) summary(newm) ## ## PLS model (class pls) summary ## ## Performance and validation: ## Number of selected components: 3 ## X cumexpvar Y cumexpvar RMSE Slope Bias RPD ## Cal 97.85 97.79 0.575 0.98 0.0000 6.87 ## CV 96.64 96.49 0.727 0.97 -0.0161 5.44 show(getRegcoeffs(newm)) ## Shoesize ## Intercept 4.952691046 ## Height 0.091079963 ## Weight 0.052708955 ## Hairleng -0.315927643 ## Age 0.000000000 ## Income 0.000000000 ## Beer 0.009320427 ## Wine 0.018524717 ## Sex -0.315927643 ## Swim 0.134354170 ## Region 0.000000000 ## IQ 0.000000000 As you can see, the variables Age, Income, Region and IQ have been excluded as they are not related to the Shoesize, which seems to be correct. Variable selection as well as all described above can be also carried out for PLS discriminant analysis (PLS-DA), which will be explained later in one of the next chapters. -->"],
+["simca-classification.html", "SIMCA classification", " SIMCA classification SIMCA (Soft Independent Modelling of Class Analogy) is a simple one-class classification method mainly based on PCA. The general idea is to create a PCA model using data for samples/objects belonging to a class and classify new objects based on how well the model can fit them. The decision is made using two residual distances — \\(Q\\) (squared residual distance from an object to its projection to PCA space) and \\(T^2\\) - distance between the projection of the object and origin of PC space. The \\(T^2\\) distance is calculated for normalized scores. The first distance (also known as “orthogonal distance”) shows how well the new object follows the same trend as the other objects from the class used to create the model, while the second (also known as “score distance”) tells how extreme it is. Both distances may have certain statistical limits, which can be used to cut-off the strangers and accept class members with a pre-defined expected ratio of false negatives (\\(\\alpha\\)). There are several ways to calculate the limits, for example, see this paper. In mdatools so far we use the simplest way, suggested by Svante Wold, where the limit for orthogonal distance is calculated using F-distribution and the score distance is computed using Hotelling T2 distribution. More methods will be available in future releases. The classification performance is assessed using true/false positives and negatives and statistics, showing the ability of a classification model to recognize class members (sensitivity or true positive rate) and how good the model is for identifying strangers (specificity or true negative rate). In addition to that, model also calculates a percent of misclassified objects. 
All statistics are calculated for calibration and validation (if any) results, but one must be aware that specificity can not be computed without objects not belonging to the class and, therefore, calibration and cross-validation results in SIMCA do not have specificity values. It must be also noted that any SIMCA model or result is also a PCA object and all plots, methods, statistics, available for PCA, can be used for SIMCA objects as well. "],
+["calibration-and-validation.html", "Calibration and validation", " Calibration and validation The model calibration is similar to PCA, but there are several additional arguments, which are important for classification. First of all it is a class name. Class name is a string, which can be used later e.g. for identifying class members for testing. The second important argument is a level of significance, alpha. This parameter is used for calculation of statistical limits and can be considered as probability for false negatives. The default value is 0.05. In this chapter as well as for describing other classification methods we will use a famous Iris dataset, available in R. The dataset includes 150 measurements of three Iris species: Setosa, Virginica and Versicolor. The measurements are length and width of petals and sepals in cm. Use ?iris for more details. Let’s get the data and split it to calibration and test sets. data(iris) head(iris) ## Sepal.Length Sepal.Width Petal.Length Petal.Width Species ## 1 5.1 3.5 1.4 0.2 setosa ## 2 4.9 3.0 1.4 0.2 setosa ## 3 4.7 3.2 1.3 0.2 setosa ## 4 4.6 3.1 1.5 0.2 setosa ## 5 5.0 3.6 1.4 0.2 setosa ## 6 5.4 3.9 1.7 0.4 setosa # generate indices for calibration set idx = seq(1, nrow(iris), by = 2) # split the values X.c = iris[idx, 1:4] c.c = iris[idx, 5, drop = F] X.t = iris[-idx, 1:4] c.t = iris[-idx, 5, drop = F] Now, because for calibration we need only objects belonging to a class, we will split the X.c into three matrices — one for each species. The data is ordered by the species, so it can be done relatively easily by taking every 25 rows. X.set = X.c[1:25, ] X.ver = X.c[26:50, ] X.vir = X.c[51:75, ] Let’s start with creating a model for class Versicolor and exploring available statistics and plots. We will use full cross-validation to validate the results. 
library(mdatools) m = simca(X.ver, &#39;versicolor&#39;, ncomp = 3, cv = 1) summary(m) ## ## SIMCA model for class &quot;versicolor&quot; summary ## ## Info: ## Significance level (alpha): 0.05 ## Selected number of components: 3 ## ## Expvar Cumexpvar Sens (cal) Expvar (cv) Sens (cv) ## Comp 1 76.44 76.44 0.96 71.85 0.88 ## Comp 2 13.93 90.37 0.92 13.91 0.84 ## Comp 3 8.45 98.82 0.92 12.24 0.84 Let’s look at plots and start with summary plot. plot(m) The plot is very similar to what we have seen for PCA model, the only difference is that it shows modelling power instead of loadings. Modelling power is a measure of contribution of each variable to the model and varies from 0 to 1. Usually variables with modelling power below 0.1 are considered as irrelevant. Let’s take a closer look at the residuals plot with different values for alpha (we will keep number of components equal to three in all cases). m1 = simca(X.ver, &#39;versicolor&#39;, ncomp = 3, cv = 1, alpha = 0.01) m2 = simca(X.ver, &#39;versicolor&#39;, ncomp = 3, cv = 1, alpha = 0.05) m3 = simca(X.ver, &#39;versicolor&#39;, ncomp = 3, cv = 1, alpha = 0.10) m4 = simca(X.ver, &#39;versicolor&#39;, ncomp = 3, cv = 1, alpha = 0.15) par(mfrow = c(2, 2)) plotResiduals(m1) plotResiduals(m2) plotResiduals(m3) plotResiduals(m4) As you can see, using alpha = 0.01 reduced number of false negatives to zero, as the acceptance limits became larger, while alpha = 0.15 gives a lot of incorrectly rejected class members. It must be noted, that decreasing alpha will also lead to a larger number of false positives, which we can not see in this case. Predictions and validation with a test set When model is ready one can test it using a new test set with known classes. In this case we will use objects from all three species and be able to see how good the model performs on strangers (and calculate the specificity). 
In order to do that we will provide both the matrix with predictors, X.t, and a vector with names of the classes for corresponding objects/rows (c.t). The values with known classes in this case can be: a vector with text values (names) a factor using the names as labels a vector with logical values (TRUE for class members and FALSE for strangers) In our case we have a factor. Instead of creating a new model and providing the values as test set we will make predictions instead. res = predict(m, X.t, c.t) summary(res) ## ## Summary for SIMCA one-class classification result ## ## Class name: versicolor ## Number of selected components: 3 ## ## Expvar Cumexpvar TP FP TN FN Spec Sens ## Comp 1 64.27 64.27 23 5 45 2 0.90 0.92 ## Comp 2 1.67 65.95 24 3 47 1 0.94 0.96 ## Comp 3 32.45 98.40 22 3 47 3 0.94 0.88 In this case we see a more detailed statistics with true/false positives and negatives, specificity and sensitivity. The performance statistics can be also shown as plots. par(mfrow = c(2, 2)) plotSpecificity(res) plotSensitivity(res) plotMisclassified(res) plotPerformance(res) The classification results can be shown both graphically and numerically. Here is a prediction plot for the results. par(mfrow = c(2, 1)) plotPredictions(res) plotPredictions(res, ncomp = 2) So we can see that for the model with three components we have no false positives (specificity = 1) and one false negative (sensitivity = 24/25 = 0.96). You can also show the predictions as a matrix with -1 and +1 using method showPredictions() or get the array with predicted class values directly as it is shown in the example below (for first 10 rows, different number of components and the first classification variable). show(res$c.pred[31:40, 1:3, 1]) ## Comp 1 Comp 2 Comp 3 ## 62 1 1 1 ## 64 1 1 1 ## 66 1 1 1 ## 68 1 1 -1 ## 70 1 1 1 ## 72 1 1 1 ## 74 1 1 -1 ## 76 1 1 1 ## 78 1 1 1 ## 80 1 1 1 "],
+["multiclass-classification.html", "Multiclass classification", " Multiclass classification Several SIMCA models can be combined to a special object simcam, which is used to make a multiclass classification. Besides this, it also allows calculating distance between individual models and a discrimination power — importance of variables to discriminate between any two classes. Let’s see how it works. First we create three single-class SIMCA models with individual settings, such as number of optimal components and alpha. m.set = simca(X.set, &#39;setosa&#39;, 3, alpha = 0.01) m.set = selectCompNum(m.set, 1) m.vir = simca(X.vir, &#39;virginica&#39;, 3) m.vir = selectCompNum(m.vir, 2) m.ver = simca(X.ver, &#39;versicola&#39;, 3) m.ver = selectCompNum(m.ver, 1) Then we combine the models into a SIMCAM model object. Summary will show the performance on calibration set, which is a combination of calibration sets for each of the individual models m = simcam(list(m.set, m.vir, m.ver)) summary(m) ## ## SIMCA multiple classes classification (class simcam) ## Nmber of classes: 3 ## Info: ## ## SIMCA model for class &quot;setosa&quot; summary ## ## Info: ## Significance level (alpha): 0.01 ## Selected number of components: 1 ## ## Expvar Cumexpvar Sens (cal) ## Comp 1 73.51 73.51 1 ## Comp 2 14.24 87.76 1 ## Comp 3 10.44 98.20 1 ## ## SIMCA model for class &quot;virginica&quot; summary ## ## Info: ## Significance level (alpha): 0.05 ## Selected number of components: 2 ## ## Expvar Cumexpvar Sens (cal) ## Comp 1 76.16 76.16 0.88 ## Comp 2 14.94 91.10 1.00 ## Comp 3 6.09 97.20 0.96 ## ## SIMCA model for class &quot;versicola&quot; summary ## ## Info: ## Significance level (alpha): 0.05 ## Selected number of components: 1 ## ## Expvar Cumexpvar Sens (cal) ## Comp 1 76.44 76.44 0.96 ## Comp 2 13.93 90.37 0.92 ## Comp 3 8.45 98.82 0.92 Now we apply the combined model to the test set and look at the predictions. 
res = predict(m, X.t, c.t) plotPredictions(res) In this case the predictions are shown only for the number of components each model found optimal. The names of classes along y-axis are the individual models. Similarly we can show the predicted values. show(res$c.pred[20:30, 1, 1:3]) ## setosa virginica versicola ## 40 1 -1 -1 ## 42 -1 -1 -1 ## 44 1 -1 -1 ## 46 1 -1 -1 ## 48 1 -1 -1 ## 50 1 -1 -1 ## 52 -1 -1 1 ## 54 -1 -1 1 ## 56 -1 1 1 ## 58 -1 -1 -1 ## 60 -1 -1 1 There are three additional plots available for multiclass SIMCA model. First of all it is a distance between a selected model and the others. par(mfrow = c(1, 2)) plotModelDistance(m, 1) plotModelDistance(m, 2) The second plot is a discrimination power, mentioned in the beginning of the section. par(mfrow = c(1, 2)) plotDiscriminationPower(m, c(1, 3), show.labels = T) plotDiscriminationPower(m, c(2, 3), show.labels = T) And, finally, a Cooman’s plot showing an orthogonal distance from objects to two selected classes/models. par(mfrow = c(1, 2)) plotCooman(m, c(1, 3), show.labels = T) plotCooman(m, c(2, 3), show.labels = T) -->"]
 ]
diff --git a/docs/simca-classification.html b/docs/simca-classification.html
new file mode 100644
index 0000000..ac544f5
--- /dev/null
+++ b/docs/simca-classification.html
@@ -0,0 +1,249 @@
+<!DOCTYPE html>
+<html >
+
+<head>
+
+  <meta charset="UTF-8">
+  <meta http-equiv="X-UA-Compatible" content="IE=edge">
+  <title>Getting started with mdatools for R</title>
+  <meta content="text/html; charset=UTF-8" http-equiv="Content-Type">
+  <meta name="description" content="This is a user guide for mdatools — R package for preprocessing, exploring and analysis of multivariate data. The package provides methods mostly common for Chemometrics. The general idea of the package is to collect most of the common chemometric methods and give a similar user interface for using them. So if a user knows how to make a model and visualise results for one method, he or she can easily do this for the others.">
+  <meta name="generator" content="bookdown 0.1 and GitBook 2.6.7">
+
+  <meta property="og:title" content="Getting started with mdatools for R" />
+  <meta property="og:type" content="book" />
+  
+  
+  <meta property="og:description" content="This is a user guide for mdatools — R package for preprocessing, exploring and analysis of multivariate data. The package provides methods mostly common for Chemometrics. The general idea of the package is to collect most of the common chemometric methods and give a similar user interface for using them. So if a user knows how to make a model and visualise results for one method, he or she can easily do this for the others." />
+  <meta name="github-repo" content="svkucheryavski/mdatools.bookdown" />
+
+  <meta name="twitter:card" content="summary" />
+  <meta name="twitter:title" content="Getting started with mdatools for R" />
+  
+  <meta name="twitter:description" content="This is a user guide for mdatools — R package for preprocessing, exploring and analysis of multivariate data. The package provides methods mostly common for Chemometrics. The general idea of the package is to collect most of the common chemometric methods and give a similar user interface for using them. So if a user knows how to make a model and visualise results for one method, he or she can easily do this for the others." />
+  
+
+<meta name="author" content="Sergey Kucheryavskiy">
+
+<meta name="date" content="2016-10-30">
+
+<script type="text/x-mathjax-config">
+MathJax.Hub.Config({
+  TeX: { equationNumbers: { autoNumber: "AMS" } }
+});
+</script>
+
+  <meta name="viewport" content="width=device-width, initial-scale=1">
+  <meta name="apple-mobile-web-app-capable" content="yes">
+  <meta name="apple-mobile-web-app-status-bar-style" content="black">
+  
+  
+<link rel="prev" href="variable-selection.html">
+<link rel="next" href="calibration-and-validation.html">
+
+<script src="libs/jquery-2.2.3/jquery.min.js"></script>
+<link href="libs/gitbook-2.6.7/css/style.css" rel="stylesheet" />
+<link href="libs/gitbook-2.6.7/css/plugin-bookdown.css" rel="stylesheet" />
+<link href="libs/gitbook-2.6.7/css/plugin-highlight.css" rel="stylesheet" />
+<link href="libs/gitbook-2.6.7/css/plugin-search.css" rel="stylesheet" />
+<link href="libs/gitbook-2.6.7/css/plugin-fontsettings.css" rel="stylesheet" />
+
+
+
+
+
+
+
+
+
+<style type="text/css">
+div.sourceCode { overflow-x: auto; }
+table.sourceCode, tr.sourceCode, td.lineNumbers, td.sourceCode {
+  margin: 0; padding: 0; vertical-align: baseline; border: none; }
+table.sourceCode { width: 100%; line-height: 100%; }
+td.lineNumbers { text-align: right; padding-right: 4px; padding-left: 4px; color: #aaaaaa; border-right: 1px solid #aaaaaa; }
+td.sourceCode { padding-left: 5px; }
+code > span.kw { color: #007020; font-weight: bold; } /* Keyword */
+code > span.dt { color: #902000; } /* DataType */
+code > span.dv { color: #40a070; } /* DecVal */
+code > span.bn { color: #40a070; } /* BaseN */
+code > span.fl { color: #40a070; } /* Float */
+code > span.ch { color: #4070a0; } /* Char */
+code > span.st { color: #4070a0; } /* String */
+code > span.co { color: #60a0b0; font-style: italic; } /* Comment */
+code > span.ot { color: #007020; } /* Other */
+code > span.al { color: #ff0000; font-weight: bold; } /* Alert */
+code > span.fu { color: #06287e; } /* Function */
+code > span.er { color: #ff0000; font-weight: bold; } /* Error */
+code > span.wa { color: #60a0b0; font-weight: bold; font-style: italic; } /* Warning */
+code > span.cn { color: #880000; } /* Constant */
+code > span.sc { color: #4070a0; } /* SpecialChar */
+code > span.vs { color: #4070a0; } /* VerbatimString */
+code > span.ss { color: #bb6688; } /* SpecialString */
+code > span.im { } /* Import */
+code > span.va { color: #19177c; } /* Variable */
+code > span.cf { color: #007020; font-weight: bold; } /* ControlFlow */
+code > span.op { color: #666666; } /* Operator */
+code > span.bu { } /* BuiltIn */
+code > span.ex { } /* Extension */
+code > span.pp { color: #bc7a00; } /* Preprocessor */
+code > span.at { color: #7d9029; } /* Attribute */
+code > span.do { color: #ba2121; font-style: italic; } /* Documentation */
+code > span.an { color: #60a0b0; font-weight: bold; font-style: italic; } /* Annotation */
+code > span.cv { color: #60a0b0; font-weight: bold; font-style: italic; } /* CommentVar */
+code > span.in { color: #60a0b0; font-weight: bold; font-style: italic; } /* Information */
+</style>
+
+</head>
+
+<body>
+
+
+  <div class="book without-animation with-summary font-size-2 font-family-1" data-basepath=".">
+
+    <div class="book-summary">
+      <nav role="navigation">
+
+<ul class="summary">
+<li class="chapter" data-level="" data-path="index.html"><a href="index.html"><i class="fa fa-check"></i>Introduction</a></li>
+<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html"><i class="fa fa-check"></i>What is new</a><ul>
+<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
+<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#last-changes-and-improvements-to-book-and-package"><i class="fa fa-check"></i>Last changes and improvements to book and package</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="overview.html"><a href="overview.html"><i class="fa fa-check"></i>Overview</a><ul>
+<li class="chapter" data-level="" data-path="what-mdatools-can-do.html"><a href="what-mdatools-can-do.html"><i class="fa fa-check"></i>What mdatools can do?</a></li>
+<li class="chapter" data-level="" data-path="how-to-install.html"><a href="how-to-install.html"><i class="fa fa-check"></i>How to install</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="datasets-and-plots.html"><a href="datasets-and-plots.html"><i class="fa fa-check"></i>Datasets and plots</a><ul>
+<li class="chapter" data-level="" data-path="attributes-and-factors.html"><a href="attributes-and-factors.html"><i class="fa fa-check"></i>Attributes and factors</a><ul>
+<li class="chapter" data-level="" data-path="attributes-and-factors.html"><a href="attributes-and-factors.html#package-specific-attributes"><i class="fa fa-check"></i>Package specific attributes</a></li>
+<li class="chapter" data-level="" data-path="attributes-and-factors.html"><a href="attributes-and-factors.html#attributes-for-plots"><i class="fa fa-check"></i>Attributes for plots</a></li>
+<li class="chapter" data-level="" data-path="attributes-and-factors.html"><a href="attributes-and-factors.html#special-methods-for-data-transformations"><i class="fa fa-check"></i>Special methods for data transformations</a></li>
+<li class="chapter" data-level="" data-path="attributes-and-factors.html"><a href="attributes-and-factors.html#data-frames-with-factors"><i class="fa fa-check"></i>Data frames with factors</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="simple-plots.html"><a href="simple-plots.html"><i class="fa fa-check"></i>Simple plots</a><ul>
+<li class="chapter" data-level="" data-path="simple-plots.html"><a href="simple-plots.html#scatter-plots"><i class="fa fa-check"></i>Scatter plots</a></li>
+<li class="chapter" data-level="" data-path="simple-plots.html"><a href="simple-plots.html#line-plots"><i class="fa fa-check"></i>Line plots</a></li>
+<li class="chapter" data-level="" data-path="simple-plots.html"><a href="simple-plots.html#bar-and-errorbar-plots"><i class="fa fa-check"></i>Bar and errorbar plots</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="plots-for-groups-of-objects.html"><a href="plots-for-groups-of-objects.html"><i class="fa fa-check"></i>Plots for groups of objects</a><ul>
+<li class="chapter" data-level="" data-path="plots-for-groups-of-objects.html"><a href="plots-for-groups-of-objects.html#one-matrix-or-data-frame"><i class="fa fa-check"></i>One matrix or data frame</a></li>
+<li class="chapter" data-level="" data-path="plots-for-groups-of-objects.html"><a href="plots-for-groups-of-objects.html#list-with-matrices-or-data-frames"><i class="fa fa-check"></i>List with matrices or data frames</a></li>
+<li class="chapter" data-level="" data-path="plots-for-groups-of-objects.html"><a href="plots-for-groups-of-objects.html#use-factors-to-split-a-dataset-into-groups"><i class="fa fa-check"></i>Use factors to split a dataset into groups</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="working-with-images.html"><a href="working-with-images.html"><i class="fa fa-check"></i>Working with images</a></li>
+<li class="chapter" data-level="" data-path="preprocessing.html"><a href="preprocessing.html"><i class="fa fa-check"></i>Preprocessing</a><ul>
+<li class="chapter" data-level="" data-path="preprocessing.html"><a href="preprocessing.html#autoscaling"><i class="fa fa-check"></i>Autoscaling</a></li>
+<li class="chapter" data-level="" data-path="preprocessing.html"><a href="preprocessing.html#correction-of-spectral-baseline"><i class="fa fa-check"></i>Correction of spectral baseline</a></li>
+<li class="chapter" data-level="" data-path="preprocessing.html"><a href="preprocessing.html#smoothing-and-derivatives"><i class="fa fa-check"></i>Smoothing and derivatives</a></li>
+</ul></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="principal-component-analysis.html"><a href="principal-component-analysis.html"><i class="fa fa-check"></i>Principal component analysis</a><ul>
+<li class="chapter" data-level="" data-path="models-and-results.html"><a href="models-and-results.html"><i class="fa fa-check"></i>Models and results</a><ul>
+<li class="chapter" data-level="" data-path="models-and-results.html"><a href="models-and-results.html#model-calibration"><i class="fa fa-check"></i>Model calibration</a></li>
+<li class="chapter" data-level="" data-path="models-and-results.html"><a href="models-and-results.html#model-validation"><i class="fa fa-check"></i>Model validation</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="plotting-methods.html"><a href="plotting-methods.html"><i class="fa fa-check"></i>Plotting methods</a><ul>
+<li class="chapter" data-level="" data-path="plotting-methods.html"><a href="plotting-methods.html#support-for-images"><i class="fa fa-check"></i>Support for images</a></li>
+<li class="chapter" data-level="" data-path="plotting-methods.html"><a href="plotting-methods.html#manual-x-values-for-loading-line-plot"><i class="fa fa-check"></i>Manual x-values for loading line plot</a></li>
+<li class="chapter" data-level="" data-path="plotting-methods.html"><a href="plotting-methods.html#excluding-rows-and-columns"><i class="fa fa-check"></i>Excluding rows and columns</a></li>
+</ul></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="partial-least-squares-regression.html"><a href="partial-least-squares-regression.html"><i class="fa fa-check"></i>Partial least squares regression</a><ul>
+<li class="chapter" data-level="" data-path="models-and-results-1.html"><a href="models-and-results-1.html"><i class="fa fa-check"></i>Models and results</a><ul>
+<li class="chapter" data-level="" data-path="models-and-results-1.html"><a href="models-and-results-1.html#model-calibration-1"><i class="fa fa-check"></i>Model calibration</a></li>
+<li class="chapter" data-level="" data-path="models-and-results-1.html"><a href="models-and-results-1.html#model-validation-1"><i class="fa fa-check"></i>Model validation</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="plotting-methods-1.html"><a href="plotting-methods-1.html"><i class="fa fa-check"></i>Plotting methods</a><ul>
+<li class="chapter" data-level="" data-path="plotting-methods-1.html"><a href="plotting-methods-1.html#excluding-rows-and-columns-1"><i class="fa fa-check"></i>Excluding rows and columns</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="variable-selection.html"><a href="variable-selection.html"><i class="fa fa-check"></i>Variable selection</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="simca-classification.html"><a href="simca-classification.html"><i class="fa fa-check"></i>SIMCA classification</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html"><i class="fa fa-check"></i>Calibration and validation</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html#predictions-and-validation-with-a-test-set"><i class="fa fa-check"></i>Predictions and validation with a test set</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="multiclass-classification.html"><a href="multiclass-classification.html"><i class="fa fa-check"></i>Multiclass classification</a></li>
+</ul></li>
+</ul>
+
+      </nav>
+    </div>
+
+    <div class="book-body">
+      <div class="body-inner">
+        <div class="book-header" role="navigation">
+          <h1>
+            <i class="fa fa-circle-o-notch fa-spin"></i><a href="./">Getting started with mdatools for R</a>
+          </h1>
+        </div>
+
+        <div class="page-wrapper" tabindex="-1" role="main">
+          <div class="page-inner">
+
+            <section class="normal" id="section-">
+<div id="simca-classification" class="section level1 unnumbered">
+<h1>SIMCA classification</h1>
+<p>SIMCA (Soft Independent Modelling of Class Analogy) is a simple one-class classification method mainly based on PCA. The general idea is to create a PCA model using data for samples/objects belonging to a class and classify new objects based on how well the model can fit them. The decision is made using two residual distances — <span class="math inline">\(Q\)</span> (squared residual distance from an object to its projection to PCA space) and <span class="math inline">\(T^2\)</span> (distance between the projection of the object and the origin of PC space). The <span class="math inline">\(T^2\)</span> distance is calculated for normalized scores.</p>
+<p>The first distance (also known as “orthogonal distance”) shows how well the new object follows the same trend as the other objects from the class used to create the model, while the second (also known as “score distance”) tells how extreme it is. Both distances may have certain statistical limits, which can be used to cut off the strangers and accept class members with a pre-defined expected ratio of false negatives (<span class="math inline">\(\alpha\)</span>). There are several ways to calculate the limits, for example, see <a href="http://onlinelibrary.wiley.com/doi/10.1002/cem.1147/abstract">this paper</a>. In <em>mdatools</em> so far we use the simplest way, suggested by Svante Wold, where the limit for the orthogonal distance is calculated using F-distribution and the limit for the score distance is computed using Hotelling T<sup>2</sup> distribution. More methods will be available in future releases.</p>
+<p>The classification performance is assessed using true/false positives and negatives and statistics, showing the ability of a classification model to recognize class members (<em>sensitivity</em> or true positive rate) and how good the model is for identifying strangers (<em>specificity</em> or true negative rate). In addition to that, the model also calculates the percentage of misclassified objects. All statistics are calculated for calibration and validation (if any) results, but one must be aware that specificity cannot be computed without objects not belonging to the class and, therefore, calibration and cross-validation results in SIMCA do not have specificity values.</p>
+<p>It must also be noted that any SIMCA model or result is also a PCA object and all plots, methods, and statistics available for PCA can be used for SIMCA objects as well.</p>
+</div>
+            </section>
+
+          </div>
+        </div>
+      </div>
+<a href="variable-selection.html" class="navigation navigation-prev " aria-label="Previous page"><i class="fa fa-angle-left"></i></a>
+<a href="calibration-and-validation.html" class="navigation navigation-next " aria-label="Next page"><i class="fa fa-angle-right"></i></a>
+
+<script src="libs/gitbook-2.6.7/js/app.min.js"></script>
+<script src="libs/gitbook-2.6.7/js/lunr.js"></script>
+<script src="libs/gitbook-2.6.7/js/plugin-search.js"></script>
+<script src="libs/gitbook-2.6.7/js/plugin-sharing.js"></script>
+<script src="libs/gitbook-2.6.7/js/plugin-fontsettings.js"></script>
+<script src="libs/gitbook-2.6.7/js/plugin-bookdown.js"></script>
+<script src="libs/gitbook-2.6.7/js/jquery.highlight.js"></script>
+<script>
+require(["gitbook"], function(gitbook) {
+gitbook.start({
+"sharing": {
+"facebook": true,
+"twitter": true,
+"google": false,
+"weibo": false,
+"instapper": false,
+"vk": false,
+"all": ["facebook", "google", "twitter", "weibo", "instapaper"]
+},
+"fontsettings": {
+"theme": "white",
+"family": "sans",
+"size": 1
+},
+"edit": {
+"link": null,
+"text": null
+},
+"download": null,
+"toc": {
+"collapse": "subsection"
+}
+});
+});
+</script>
+
+<!-- dynamically load mathjax for compatibility with self-contained -->
+<script>
+  (function () {
+    var script = document.createElement("script");
+    script.type = "text/javascript";
+    script.src  = "https://cdn.mathjax.org/mathjax/latest/MathJax.js?config=TeX-AMS-MML_HTMLorMML";
+    if (location.protocol !== "file:" && /^https?:/.test(script.src))
+      script.src  = script.src.replace(/^https?:/, '');
+    document.getElementsByTagName("head")[0].appendChild(script);
+  })();
+</script>
+</body>
+
+</html>
diff --git a/docs/simple-plots.html b/docs/simple-plots.html
index 92181b2..597e9c4 100644
--- a/docs/simple-plots.html
+++ b/docs/simple-plots.html
@@ -25,7 +25,7 @@
 
 <meta name="author" content="Sergey Kucheryavskiy">
 
-<meta name="date" content="2016-10-16">
+<meta name="date" content="2016-10-30">
 
 <script type="text/x-mathjax-config">
 MathJax.Hub.Config({
@@ -107,7 +107,7 @@
 <ul class="summary">
 <li class="chapter" data-level="" data-path="index.html"><a href="index.html"><i class="fa fa-check"></i>Introduction</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html"><i class="fa fa-check"></i>What is new</a><ul>
-<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-to-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
+<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#last-changes-and-improvements-to-book-and-package"><i class="fa fa-check"></i>Last changes and improvements to book and package</a></li>
 </ul></li>
 <li class="chapter" data-level="" data-path="overview.html"><a href="overview.html"><i class="fa fa-check"></i>Overview</a><ul>
@@ -159,6 +159,12 @@
 </ul></li>
 <li class="chapter" data-level="" data-path="variable-selection.html"><a href="variable-selection.html"><i class="fa fa-check"></i>Variable selection</a></li>
 </ul></li>
+<li class="chapter" data-level="" data-path="simca-classification.html"><a href="simca-classification.html"><i class="fa fa-check"></i>SIMCA classification</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html"><i class="fa fa-check"></i>Calibration and validation</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html#predictions-and-validation-with-a-test-set"><i class="fa fa-check"></i>Predictions and validation with a test set</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="multiclass-classification.html"><a href="multiclass-classification.html"><i class="fa fa-check"></i>Multiclass classification</a></li>
+</ul></li>
 </ul>
 
       </nav>
diff --git a/docs/variable-selection.html b/docs/variable-selection.html
index 03925a2..1a34cbb 100644
--- a/docs/variable-selection.html
+++ b/docs/variable-selection.html
@@ -25,7 +25,7 @@
 
 <meta name="author" content="Sergey Kucheryavskiy">
 
-<meta name="date" content="2016-10-16">
+<meta name="date" content="2016-10-30">
 
 <script type="text/x-mathjax-config">
 MathJax.Hub.Config({
@@ -39,7 +39,7 @@
   
   
 <link rel="prev" href="plotting-methods-1.html">
-
+<link rel="next" href="simca-classification.html">
 
 <script src="libs/jquery-2.2.3/jquery.min.js"></script>
 <link href="libs/gitbook-2.6.7/css/style.css" rel="stylesheet" />
@@ -107,7 +107,7 @@
 <ul class="summary">
 <li class="chapter" data-level="" data-path="index.html"><a href="index.html"><i class="fa fa-check"></i>Introduction</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html"><i class="fa fa-check"></i>What is new</a><ul>
-<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-to-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
+<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#last-changes-and-improvements-to-book-and-package"><i class="fa fa-check"></i>Last changes and improvements to book and package</a></li>
 </ul></li>
 <li class="chapter" data-level="" data-path="overview.html"><a href="overview.html"><i class="fa fa-check"></i>Overview</a><ul>
@@ -159,6 +159,12 @@
 </ul></li>
 <li class="chapter" data-level="" data-path="variable-selection.html"><a href="variable-selection.html"><i class="fa fa-check"></i>Variable selection</a></li>
 </ul></li>
+<li class="chapter" data-level="" data-path="simca-classification.html"><a href="simca-classification.html"><i class="fa fa-check"></i>SIMCA classification</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html"><i class="fa fa-check"></i>Calibration and validation</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html#predictions-and-validation-with-a-test-set"><i class="fa fa-check"></i>Predictions and validation with a test set</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="multiclass-classification.html"><a href="multiclass-classification.html"><i class="fa fa-check"></i>Multiclass classification</a></li>
+</ul></li>
 </ul>
 
       </nav>
@@ -274,8 +280,8 @@ <h2>Variable selection</h2>
           </div>
         </div>
       </div>
-<a href="plotting-methods-1.html" class="navigation navigation-prev navigation-unique" aria-label="Previous page"><i class="fa fa-angle-left"></i></a>
-
+<a href="plotting-methods-1.html" class="navigation navigation-prev " aria-label="Previous page"><i class="fa fa-angle-left"></i></a>
+<a href="simca-classification.html" class="navigation navigation-next " aria-label="Next page"><i class="fa fa-angle-right"></i></a>
 
 <script src="libs/gitbook-2.6.7/js/app.min.js"></script>
 <script src="libs/gitbook-2.6.7/js/lunr.js"></script>
diff --git a/docs/what-is-new.html b/docs/what-is-new.html
index b8febce..9f37217 100644
--- a/docs/what-is-new.html
+++ b/docs/what-is-new.html
@@ -25,7 +25,7 @@
 
 <meta name="author" content="Sergey Kucheryavskiy">
 
-<meta name="date" content="2016-10-16">
+<meta name="date" content="2016-10-30">
 
 <script type="text/x-mathjax-config">
 MathJax.Hub.Config({
@@ -107,7 +107,7 @@
 <ul class="summary">
 <li class="chapter" data-level="" data-path="index.html"><a href="index.html"><i class="fa fa-check"></i>Introduction</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html"><i class="fa fa-check"></i>What is new</a><ul>
-<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-to-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
+<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#last-changes-and-improvements-to-book-and-package"><i class="fa fa-check"></i>Last changes and improvements to book and package</a></li>
 </ul></li>
 <li class="chapter" data-level="" data-path="overview.html"><a href="overview.html"><i class="fa fa-check"></i>Overview</a><ul>
@@ -159,6 +159,12 @@
 </ul></li>
 <li class="chapter" data-level="" data-path="variable-selection.html"><a href="variable-selection.html"><i class="fa fa-check"></i>Variable selection</a></li>
 </ul></li>
+<li class="chapter" data-level="" data-path="simca-classification.html"><a href="simca-classification.html"><i class="fa fa-check"></i>SIMCA classification</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html"><i class="fa fa-check"></i>Calibration and validation</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html#predictions-and-validation-with-a-test-set"><i class="fa fa-check"></i>Predictions and validation with a test set</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="multiclass-classification.html"><a href="multiclass-classification.html"><i class="fa fa-check"></i>Multiclass classification</a></li>
+</ul></li>
 </ul>
 
       </nav>
@@ -178,8 +184,8 @@ <h1>
             <section class="normal" id="section-">
 <div id="what-is-new" class="section level1 unnumbered">
 <h1>What is new</h1>
-<div id="what-to-expect-from-future-releases" class="section level3 unnumbered">
-<h3>What to expect from future releases</h3>
+<div id="what-expect-from-future-releases" class="section level3 unnumbered">
+<h3>What to expect from future releases</h3>
 <p><strong>Book</strong></p>
 <ul>
 <li>Chapters about classification (SIMCA, SIMCA for multiple classes, PLS-DA)</li>
@@ -196,6 +202,12 @@ <h3>What to expect from future releases</h3>
 </div>
 <div id="last-changes-and-improvements-to-book-and-package" class="section level3 unnumbered">
 <h3>Last changes and improvements to book and package</h3>
+<p><strong>30.10.2016</strong></p>
+<ul>
+<li>fixed a bug in PCA when explained variance was calculated incorrectly for data with excluded rows</li>
+<li>fixed several issues with SIMCA (cross-validation) and SIMCAM (Coomans’ plot)</li>
+<li>added a chapter about SIMCA to the tutorial</li>
+</ul>
 <p><strong>14.10.2016</strong></p>
 <p>The new version (0.8.0) brings a lot of new features, therefore it was decided to rewrite this tutorial completely and start this log from scratch. Most of the things available in the previous version of the package will work without any changes. But if you have been using functions <code>mdaplot()</code> and <code>mdaplotg()</code> it makes sense to read how the new implementation works and rewrite your code. The use of plotting tools became much simpler and more efficient. The main changes in the package are:</p>
 <ul>
diff --git a/docs/what-mdatools-can-do.html b/docs/what-mdatools-can-do.html
index 6630025..8b84b87 100644
--- a/docs/what-mdatools-can-do.html
+++ b/docs/what-mdatools-can-do.html
@@ -25,7 +25,7 @@
 
 <meta name="author" content="Sergey Kucheryavskiy">
 
-<meta name="date" content="2016-10-16">
+<meta name="date" content="2016-10-30">
 
 <script type="text/x-mathjax-config">
 MathJax.Hub.Config({
@@ -107,7 +107,7 @@
 <ul class="summary">
 <li class="chapter" data-level="" data-path="index.html"><a href="index.html"><i class="fa fa-check"></i>Introduction</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html"><i class="fa fa-check"></i>What is new</a><ul>
-<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-to-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
+<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#last-changes-and-improvements-to-book-and-package"><i class="fa fa-check"></i>Last changes and improvements to book and package</a></li>
 </ul></li>
 <li class="chapter" data-level="" data-path="overview.html"><a href="overview.html"><i class="fa fa-check"></i>Overview</a><ul>
@@ -159,6 +159,12 @@
 </ul></li>
 <li class="chapter" data-level="" data-path="variable-selection.html"><a href="variable-selection.html"><i class="fa fa-check"></i>Variable selection</a></li>
 </ul></li>
+<li class="chapter" data-level="" data-path="simca-classification.html"><a href="simca-classification.html"><i class="fa fa-check"></i>SIMCA classification</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html"><i class="fa fa-check"></i>Calibration and validation</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html#predictions-and-validation-with-a-test-set"><i class="fa fa-check"></i>Predictions and validation with a test set</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="multiclass-classification.html"><a href="multiclass-classification.html"><i class="fa fa-check"></i>Multiclass classification</a></li>
+</ul></li>
 </ul>
 
       </nav>
diff --git a/docs/working-with-images.html b/docs/working-with-images.html
index 0626b95..18c8476 100644
--- a/docs/working-with-images.html
+++ b/docs/working-with-images.html
@@ -25,7 +25,7 @@
 
 <meta name="author" content="Sergey Kucheryavskiy">
 
-<meta name="date" content="2016-10-16">
+<meta name="date" content="2016-10-30">
 
 <script type="text/x-mathjax-config">
 MathJax.Hub.Config({
@@ -107,7 +107,7 @@
 <ul class="summary">
 <li class="chapter" data-level="" data-path="index.html"><a href="index.html"><i class="fa fa-check"></i>Introduction</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html"><i class="fa fa-check"></i>What is new</a><ul>
-<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-to-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
+<li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#what-expect-from-future-releases"><i class="fa fa-check"></i>What to expect from future releases</a></li>
 <li class="chapter" data-level="" data-path="what-is-new.html"><a href="what-is-new.html#last-changes-and-improvements-to-book-and-package"><i class="fa fa-check"></i>Last changes and improvements to book and package</a></li>
 </ul></li>
 <li class="chapter" data-level="" data-path="overview.html"><a href="overview.html"><i class="fa fa-check"></i>Overview</a><ul>
@@ -159,6 +159,12 @@
 </ul></li>
 <li class="chapter" data-level="" data-path="variable-selection.html"><a href="variable-selection.html"><i class="fa fa-check"></i>Variable selection</a></li>
 </ul></li>
+<li class="chapter" data-level="" data-path="simca-classification.html"><a href="simca-classification.html"><i class="fa fa-check"></i>SIMCA classification</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html"><i class="fa fa-check"></i>Calibration and validation</a><ul>
+<li class="chapter" data-level="" data-path="calibration-and-validation.html"><a href="calibration-and-validation.html#predictions-and-validation-with-a-test-set"><i class="fa fa-check"></i>Predictions and validation with a test set</a></li>
+</ul></li>
+<li class="chapter" data-level="" data-path="multiclass-classification.html"><a href="multiclass-classification.html"><i class="fa fa-check"></i>Multiclass classification</a></li>
+</ul></li>
 </ul>
 
       </nav>