File: princomp.sci

package info (click to toggle)
scilab 5.2.2-9
  • links: PTS, VCS
  • area: main
  • in suites: squeeze
  • size: 334,832 kB
  • ctags: 52,586
  • sloc: xml: 526,945; ansic: 223,590; fortran: 163,080; java: 56,934; cpp: 33,840; tcl: 27,936; sh: 20,397; makefile: 9,908; ml: 9,451; perl: 1,323; cs: 614; lisp: 30
file content (77 lines) | stat: -rw-r--r-- 2,242 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
// Scilab ( http://www.scilab.org/ ) - This file is part of Scilab
// Copyright (C) 2000 - INRIA - Carlos Klimann
// 
// This file must be used under the terms of the CeCILL.
// This source file is licensed as described in the file COPYING, which
// you should have received as part of this distribution.  The terms
// are also available at
// http://www.cecill.info/licences/Licence_CeCILL_V2-en.txt
// 

function [facpr,comprinc,lambda,tsquare]=princomp(x,eco)
//
//Principal component analysis of the data matrix x.
//
//The idea behind this method is to represent, in an
//approximate manner, a cluster of n individuals in a
//lower-dimensional subspace, by projecting the cluster onto
//that subspace. The k-dimensional projection subspace is
//chosen so that distances are deformed as little as
//possible: we look for the k-dimensional subspace for which
//the sum of the squared distances in the projection is as
//large as possible (a projection can only shrink
//distances). In other words, the inertia of the projection
//onto the k-dimensional subspace must be maximal.
//
//Parameters
//  x   : rowx-by-colx matrix; each row is one individual and
//        each column one variable (columns are centered
//        before the decomposition).
//  eco : optional boolean (default %f). When %t the
//        economy-size svd(y,"e") is used instead of svd(y).
//
//Returns
//  facpr    : right singular vectors of the centered data
//             (the principal directions).
//  comprinc : centered data projected on facpr (the scores).
//  lambda   : column vector of squared singular values
//             divided by (rowx-1).
//  tsquare  : rowx-by-1 vector, Hotelling's T-squared
//             statistic of each row, computed over the
//             numerically non-negligible components only.
//
//An empty x yields four empty outputs. A non-boolean eco
//raises an error.
//
//References: Saporta, Gilbert, Probabilites, Analyse des
//Donnees et Statistique, Editions Technip, Paris, 1990.
//
//derived from pca,
//  author: carlos klimann
//
  if argn(2)<2 then eco=%f; end
  if type(eco)<>4 then
    error(msprintf(_("%s: Wrong type for input argument #%d: Boolean expected."),"princomp",2))
  end

  if x==[] then
    facpr=[];
    comprinc=[];
    lambda=[];
    tsquare=[];
    return;
  end

  [rowx,colx]=size(x);

  //center data (remove the mean of every column)
  y=center(x,1);

  //compute eigenvectors of y'*y using svd
  if eco then
    [U,lambda,facpr]=svd(y,"e");
  else
    [U,lambda,facpr]=svd(y);
  end
  lambda=diag(lambda).^2/(rowx-1);//normalize
  comprinc=y*facpr;

  //Centering removes one degree of freedom, so with
  //rowx <= colx the component of index rowx (and beyond)
  //carries no variance and is dropped.
  if rowx <= colx then
    if eco then
      lambda(rowx)=[];
      facpr(:,rowx)=[];
      comprinc(:,rowx)=[];
    else
      //facpr is left untouched in the full decomposition
      lambda(rowx:$)=[];
      comprinc(:,rowx:$)=[];
    end
  end

  //Number q of numerically significant components.
  //find(...,1) gives the index of the FIRST negligible
  //eigenvalue, so the significant ones are 1:(index-1);
  //including that index would add a null direction of U
  //to the T-squared statistic.
  firstnull=find(lambda<=max(rowx,colx)*%eps*lambda(1),1);
  if firstnull==[] then
    q=size(lambda,'*');
  else
    q=firstnull-1;
  end

  if q>0 then
    tsquare=(rowx-1)*sum(U(:,1:q).^2,2);
  else
    //no significant component (e.g. constant data)
    tsquare=zeros(rowx,1);
  end
endfunction