File: test_wordtokenizer_main.cpp

package info (click to toggle)
source-highlight 3.1.9-4.3
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid, trixie
  • size: 10,612 kB
  • sloc: cpp: 10,202; ansic: 9,521; sh: 4,582; makefile: 1,893; lex: 1,200; yacc: 1,021; javascript: 338; php: 213; perl: 211; awk: 98; erlang: 94; lisp: 90; java: 75; ruby: 69; python: 61; asm: 43; ada: 37; ml: 29; haskell: 27; xml: 23; cs: 11; sql: 8; tcl: 7; sed: 4
file content (56 lines) | stat: -rw-r--r-- 1,559 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
#ifdef HAVE_CONFIG_H
#include "config.h"
#endif

#include <iostream>

#include "asserttestexit.h"
#include "srchilite/wordtokenizer.h"
#include "srchilite/tostringcollection.h"

using namespace std;
using namespace srchilite;

/*
 * The overload below has to live in namespace 'std' because
 * 'WordTokenizer::WordTokenizerResults::value_type' is a
 * std::pair<std::string, std::string> in disguise. 'operator<<()' must be
 * declared in the same namespace as its argument type for ADL to find it;
 * otherwise gcc-12 and clang-13 cannot find the overload.
 */
namespace std {

/*
 * Prints one tokenizer result on its own line.
 *
 * A token whose 'first' member is non-empty is printed as
 *   space: "<first>"
 * and any other token is printed as
 *   word : "<second>"
 *
 * Declared 'static' so the overload stays local to this translation unit.
 * Returns the stream that was passed in, so calls can be chained.
 */
static ostream &operator <<(ostream &os, const WordTokenizer::WordTokenizerResults::value_type &token) {
    if (token.first.empty()) {
        os << "word : \"" << token.second;
    } else {
        os << "space: \"" << token.first;
    }

    // Both kinds of token end with the closing quote and a flushed newline.
    os << "\"" << endl;

    return os;
}

}

/*
 * Tokenizes a fixed sample string and checks, token by token, that the
 * results alternate between whitespace runs (read from 'first') and words
 * (read from 'second') in input order.
 *
 * Prints the collected tokens, then a success message, and returns 0.
 * NOTE(review): presumably the assert helpers from asserttestexit.h stop the
 * program on a failed check -- confirm against that header.
 */
int main() {
    WordTokenizer::WordTokenizerResults tokens;

    WordTokenizer::tokenize(" Here  are\t \t some_words!", tokens);

    cout << "tokens: " << collectionToString(&tokens) << endl;

    WordTokenizer::WordTokenizerResults::const_iterator tok = tokens.begin();

    // The iterator is compared against end() before every dereference, so a
    // tokenizer that yields too few tokens produces a failed check instead of
    // dereferencing the end iterator.
    assertTrue(tok != tokens.end());
    assertEquals(" ", tok->first);
    ++tok;

    assertTrue(tok != tokens.end());
    assertEquals("Here", tok->second);
    ++tok;

    assertTrue(tok != tokens.end());
    assertEquals("  ", tok->first);
    ++tok;

    assertTrue(tok != tokens.end());
    assertEquals("are", tok->second);
    ++tok;

    assertTrue(tok != tokens.end());
    assertEquals("\t \t ", tok->first);
    ++tok;

    assertTrue(tok != tokens.end());
    assertEquals("some_words!", tok->second);

    cout << "test_wordtokenizer: SUCCESS" << endl;

    return 0;
}