File: StdDataSet.h

package info (click to toggle)
torch 2-1
  • links: PTS
  • area: main
  • in suites: woody
  • size: 5,488 kB
  • ctags: 3,217
  • sloc: cpp: 14,272; makefile: 201
file content (107 lines) | stat: -rw-r--r-- 2,844 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
// Copyright (C) 2002 Ronan Collobert (collober@iro.umontreal.ca)
//                
//
// This file is part of Torch. Release II.
// [The Ultimate Machine Learning Library]
//
// Torch is free software; you can redistribute it and/or modify
// it under the terms of the GNU General Public License as published by
// the Free Software Foundation; either version 2 of the License, or
// (at your option) any later version.
//
// Torch is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
// GNU General Public License for more details.
//
// You should have received a copy of the GNU General Public License
// along with Torch; if not, write to the Free Software
// Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA

#ifndef STD_DATA_SET_INC
#define STD_DATA_SET_INC

#include "EuclideanDataSet.h"
#include "normalize.h"

namespace Torch {

/** Standard Data Set.

    DataSet with a vector of reals for inputs,
    and a vector of reals for targets.

    This DataSet supports normalization by mean/stdv
    (see the options below).

    Options:
    \begin{tabular}{lcll}
      "normalize inputs"  &  bool &   normalize the inputs by mean/stdv  & [false]\\
      "normalize targets" &  bool &   normalize the targets by mean/stdv & [false]
    \end{tabular}

    Expected call order, as stated by the member documentation below:
    #setInputs()#/#setTargets()# BEFORE #init()#, and
    #normalizeUsingDataSet()# AFTER #init()#.

    NOTE(review): the class holds raw pointers and declares a destructor,
    but no copy constructor or assignment operator is declared here.
    Copying a #StdDataSet# is presumably unsafe -- confirm against the
    implementation file before doing so.

    @author Ronan Collobert (collober@iro.umontreal.ca)
*/
class StdDataSet : public EuclideanDataSet
{
  public:
    /// The inputs table.
    /// (Presumably one #real*# row per example -- TODO confirm.)
    real **all_inputs;

    /// The targets table.
    /// (Presumably one #real*# row per example -- TODO confirm.)
    real **all_targets;

    /// Normalization flag for the inputs.
    /// (Presumably backs the "normalize inputs" option -- TODO confirm.)
    bool norm_inputs;

    /// Normalization flag for the targets.
    /// (Presumably backs the "normalize targets" option -- TODO confirm.)
    bool norm_targets;

    /// Normalization parameters.
    /// (Presumably #mean_i#/#stdv_i# are the mean and standard deviation
    /// of the inputs and #mean_o#/#stdv_o# those of the targets, one
    /// value per dimension -- TODO confirm in the implementation.)
    real *mean_i;
    real *mean_o;
    real *stdv_i;
    real *stdv_o;

    //-----

    /// Default constructor.
    StdDataSet();

    /** Normalize the #StdDataSet# using the normalization values
        of another #StdDataSet#. If the other dataset is not normalized,
        nothing will be done.

        #data_norm# is the dataset whose normalization values are used.

        Call it AFTER #init()#.
    */
    virtual void normalizeUsingDataSet(StdDataSet *data_norm);

    /** Set the inputs and the targets to user-provided tables.
        #data_# is the inputs table and #y_# is the targets table.
        #n_dim# is the dimension of the input vectors and
        #n_targets_# is the dimension of the target vectors.
        (#n_examples_# is presumably the number of examples in the
        tables -- TODO confirm.)

        NOTE(review): whether the tables are copied or only referenced,
        and who frees them, is not visible from this header.

        Call them BEFORE #init()#.
    */
    void setInputs(real **data_, int n_dim, int n_examples_);
    /// Set the targets table; see #setInputs()# above.
    void setTargets(real **y_, int n_targets_);

    /// Load the normalization parameters from #file#.
    virtual void loadFILE(FILE *file);

    /// Save the normalization parameters to #file#.
    virtual void saveFILE(FILE *file);

    //-----

    // NOTE(review): the four virtual methods below are presumably
    // overrides of the DataSet/EuclideanDataSet interface; their exact
    // contract is defined by the base classes -- confirm there.
    // Judging by the names only: #t#, #i# and #j# look like example
    // indices, and #x#/#y# like vectors given as #List#s.

    virtual void setRealExample(int t);
    virtual real realRealDotProduct(int i, int j);
    virtual real realDotProduct(int i, List *y);
    virtual real dotProduct(List *x, List *y);

    //-----

    /// Initialize the dataset. Per the notes above, the inputs/targets
    /// must be set before this call.
    virtual void init();

    /// Normalize the dataset.
    /// (Presumably honours #norm_inputs#/#norm_targets# -- TODO confirm.)
    virtual void normalize();

    /// Destructor.
    /// NOTE(review): which of the pointer members it releases is not
    /// visible from this header.
    virtual ~StdDataSet();
};


}

#endif