File: IOHtk.h

package info (click to toggle)
torch 2-1
  • links: PTS
  • area: main
  • in suites: woody
  • size: 5,488 kB
  • ctags: 3,217
  • sloc: cpp: 14,272; makefile: 201
file content (125 lines) | stat: -rw-r--r-- 3,769 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
// Copyright (C) 2002 Johnny Mariethoz (Johnny.Mariethoz@idiap.ch)
//                and Samy Bengio (bengio@idiap.ch)
//                
//
// This file is part of Torch. Release II.
// [The Ultimate Machine Learning Library]
//
// Torch is free software; you can redistribute it and/or modify
// it under the terms of the GNU General Public License as published by
// the Free Software Foundation; either version 2 of the License, or
// (at your option) any later version.
//
// Torch is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
// GNU General Public License for more details.
//
// You should have received a copy of the GNU General Public License
// along with Torch; if not, write to the Free Software
// Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA

#ifndef IOHTK_INC
#define IOHTK_INC

#include "Object.h"

namespace Torch {

/** HTK file header record.
 *
 * The member order below is part of the contract: code that fills or
 * dumps this record relies on nSamples, sampPeriod, sampSize, sampKind
 * appearing in exactly this sequence.
 *
 * NOTE(review): the HTK format documents its header as two 4-byte
 * integers followed by two 2-byte integers. `long` is 8 bytes on LP64
 * platforms, so this struct is presumably only safe as a raw byte image
 * of the on-disk header where `long` is 32 bits -- confirm how IOHtk.cc
 * reads and writes it before porting.
 */
struct HTKhdr
{
    /// sample count (presumably the number of frames in the file -- confirm)
    long  nSamples;

    /// sample period (HTK specifies 100 ns units -- confirm against IOHtk.cc)
    long  sampPeriod;

    /// sample size (presumably bytes per sample -- confirm)
    short sampSize;

    /// sample kind code; the same underlying type as ParmKind (short)
    short sampKind;
};

/* Parameter-kind qualifier flags.
 *
 * The low six bits of a ParmKind hold the base kind (see BASEMASK); each
 * flag below occupies one distinct higher bit.  Values are written in
 * hexadecimal here; the octal spelling is kept in each comment.
 *
 * These are preprocessor macros, so they are NOT scoped by the enclosing
 * namespace: they are visible globally wherever this header is included.
 */
#define BASEMASK  0x003F      /* Mask to remove qualifiers        (octal 077)    */
#define HASENERGY 0x0040      /* _E log energy included           (octal 0100)   */
#define HASNULLE  0x0080      /* _N absolute energy suppressed    (octal 0200)   */
#define HASDELTA  0x0100      /* _D delta coef appended           (octal 0400)   */
#define HASACCS   0x0200      /* _A acceleration coefs appended   (octal 01000)  */
#define HASCOMPX  0x0400      /* _C is compressed                 (octal 02000)  */
#define HASZEROM  0x0800      /* _Z zero meaned                   (octal 04000)  */
#define HASCRCC   0x1000      /* _K has CRC check                 (octal 010000) */
#define HASZEROC  0x2000      /* _0 0'th Cepstra included         (octal 020000) */
#define HASVQ     0x4000      /* _V has VQ index attached         (octal 040000) */


/* Base parameter kinds.
 *
 * The numeric values are consecutive starting at 0 and are spelled out
 * explicitly so the mapping is visible at a glance.  Every value fits in
 * the six bits selected by BASEMASK.
 *
 * NOTE(review): a name beginning with an underscore followed by an
 * uppercase letter is reserved for the implementation in C++; it is kept
 * because renaming would change the public interface.
 */
enum _BaseParmKind {
  WAVEFORM  = 0,    /* Raw speech waveform (handled by HWave) */

  /* LP-based Coefficients */
  LPC       = 1,
  LPREFC    = 2,
  LPCEPSTRA = 3,
  LPDELCEP  = 4,

  IREFC     = 5,    /* Ref Coef in 16 bit form */
  MFCC      = 6,    /* Mel-Freq Cepstra */
  FBANK     = 7,    /* Log Filter Bank */
  MELSPEC   = 8,    /* Mel-Freq Spectrum (Linear) */
  USER      = 9,    /* Arbitrary user specified data */
  DISCRETE  = 10,   /* Discrete VQ symbols (shorts) */
  ANON      = 11    /* (not described in this header) */
};

/* Parameter kind code: a _BaseParmKind value together with qualifier
   flags (the HAS* macros); BASEMASK strips the qualifiers again.
   Presumably the two parts are combined with bitwise OR -- confirm in
   IOHtk.cc. */
typedef short ParmKind;          /* BaseParmKind + Qualifiers */


/** Reader for HTK files (used for various datasets); it also declares a
 *  method to write the data back out in HTK binary format.
 *
 *  All data members are public.  Who allocates and frees the pointer
 *  members is decided in IOHtk.cc, which is not visible from this header.
 *
 *  NOTE(review): the single-argument constructor is not `explicit`, and
 *  the class holds raw pointers without declaring copy operations --
 *  check IOHtk.cc before copying instances.
 *
 *  @author Samy Bengio (bengio@idiap.ch)
 *  @author Johnny Mariethoz (Johnny.Mariethoz@idiap.ch)
 */
class IOHtk : public Object
{
  public:

    /// the data itself (presumably n_lines * n_cols values -- confirm)
    real* data;

    /// number of columns in the data
    int n_cols;

    /// number of lines in the data
    int n_lines;

    /// kind of data, as a string
    char* kind;

    /// name of the file
    char* file_name;

    /// sampling period
    long samp_period;

    /** Build an IOHtk object for a given file.

        @param file     name of the corresponding file
        @param max_load maximum number of examples to load; the default
                        of -1 presumably means "no limit" -- confirm
    */
    IOHtk(char* file, int max_load = -1);

    /** Write the data in HTK binary format into the specified directory.

        @param dir_to_save target directory; what the default of NULL
                           selects is defined in IOHtk.cc
    */
    void write(char* dir_to_save = NULL);

    /** Create a mask to remove energy and the corresponding delta and
        delta-delta.

        @param mask caller-supplied array (presumably one entry per
                    column -- confirm the expected length)
    */
    virtual void createMaskFromParam(bool* mask);

    virtual ~IOHtk();


    /// Helpers taken from the HTK source code.

    /// convert a parameter kind to its string form, using buf
    char* parmKind2Str(ParmKind kind, char* buf);

    /// convert a string to a parameter kind
    ParmKind str2ParmKind(char* str);

    /// base kind of a parameter kind (presumably kind & BASEMASK -- confirm)
    ParmKind baseParmKind(ParmKind kind);

    /// Qualifier predicates; names parallel the HAS* macros, so each
    /// presumably tests the matching bit of kind -- confirm in IOHtk.cc.
    bool hasEnergy(ParmKind kind);
    bool hasDelta(ParmKind kind);
    bool hasAccs(ParmKind kind);
    bool hasNulle(ParmKind kind);
    bool hasCompx(ParmKind kind);
    bool hasCrcc(ParmKind kind);
    bool hasZerom(ParmKind kind);
    bool hasZeroc(ParmKind kind);
    bool hasVQ(ParmKind kind);
};

}

#endif