File: simple.c

package info (click to toggle)
pocketsphinx 5.0.4-2
  • links: PTS, VCS
  • area: main
  • in suites:
  • size: 51,236 kB
  • sloc: ansic: 54,519; python: 2,438; sh: 566; cpp: 410; perl: 342; yacc: 93; lex: 50; makefile: 30
file content (85 lines) | stat: -rw-r--r-- 2,562 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
/* Example of simple PocketSphinx recognition.
 *
 * MIT license (c) 2022, see LICENSE for more information.
 *
 * Author: David Huggins-Daines <dhdaines@gmail.com>
 */
/**
 * @example simple.c
 * @brief Simplest possible example of speech recognition in C.
 *
 * This file shows how to use PocketSphinx to recognize a single input
 * file.  To compile it, assuming you have built the library as in
 * \ref unix_install "these directions", you can run:
 *
 *     cmake --build build --target simple
 *
 * Alternately, if PocketSphinx is installed system-wide, you can run:
 *
 *     gcc -o simple simple.c $(pkg-config --libs --cflags pocketsphinx)
 *
 *
 */

#include <pocketsphinx.h>
#include <stdlib.h>

/**
 * Recognize the speech in a single audio file and print the hypothesis.
 *
 * The audio payload of the file named by argv[1] is read into memory in
 * one go and handed to the decoder as a single, complete utterance.
 * Every failure is reported through E_FATAL() / E_FATAL_SYSTEM(), which
 * terminate the program, so this function only returns on success.
 *
 * @param argc Number of command-line arguments; at least 2 are required.
 * @param argv Argument vector; argv[1] is the path of the audio file.
 * @return 0 once the file has been decoded.
 */
int
main(int argc, char *argv[])
{
    ps_decoder_t *decoder;
    ps_config_t *config;
    const char *hyp;
    FILE *fh;
    short *buf;
    long file_size, data_start;
    size_t len, nsamples;

    /* Look for a single audio file as input parameter. */
    if (argc < 2)
        E_FATAL("Usage: %s FILE\n", argc > 0 ? argv[0] : "simple");
    if ((fh = fopen(argv[1], "rb")) == NULL)
        E_FATAL_SYSTEM("Failed to open %s", argv[1]);

    /* Get the size of the input.  ftell() reports failure as -1, so keep
     * the result signed until it has been checked. */
    if (fseek(fh, 0, SEEK_END) < 0)
        E_FATAL_SYSTEM("Unable to find end of input file %s", argv[1]);
    if ((file_size = ftell(fh)) < 0)
        E_FATAL_SYSTEM("Unable to get size of input file %s", argv[1]);
    rewind(fh);

    /* Initialize configuration from input file. */
    if ((config = ps_config_init(NULL)) == NULL)
        E_FATAL("PocketSphinx configuration init failed\n");
    ps_default_search_args(config);
    if (ps_config_soundfile(config, fh, argv[1]) < 0)
        E_FATAL("Unsupported input file %s\n", argv[1]);
    if ((decoder = ps_init(config)) == NULL)
        E_FATAL("PocketSphinx decoder init failed\n");

    /* The stream now sits just past the header; what remains is audio. */
    if ((data_start = ftell(fh)) < 0)
        E_FATAL_SYSTEM("Unable to get data offset in input file %s", argv[1]);
    if (data_start > file_size)
        E_FATAL("Unsupported input file %s\n", argv[1]);
    len = (size_t)(file_size - data_start);

    /* Allocate data (skipping header).  malloc(0) is allowed to return
     * NULL, so never request zero bytes for a header-only file. */
    if ((buf = malloc(len > 0 ? len : 1)) == NULL)
        E_FATAL_SYSTEM("Unable to allocate %zu bytes", len);
    /* Read input */
    nsamples = fread(buf, sizeof(buf[0]), len / sizeof(buf[0]), fh);
    if (nsamples != len / sizeof(buf[0]))
        E_FATAL_SYSTEM("Unable to read %zu samples", len / sizeof(buf[0]));

    /* Recognize it!  The entire file is passed as one full utterance. */
    if (ps_start_utt(decoder) < 0)
        E_FATAL("Failed to start processing\n");
    if (ps_process_raw(decoder, buf, nsamples, FALSE, TRUE) < 0)
        E_FATAL("ps_process_raw() failed\n");
    if (ps_end_utt(decoder) < 0)
        E_FATAL("Failed to end processing\n");

    /* Print the result (there is none if nothing was recognized). */
    if ((hyp = ps_get_hyp(decoder, NULL)) != NULL)
        printf("%s\n", hyp);

    /* Clean up */
    if (fclose(fh) < 0)
        E_FATAL_SYSTEM("Failed to close %s", argv[1]);
    free(buf);
    ps_free(decoder);
    ps_config_free(config);

    return 0;
}