1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57
|
// https://www.boost.org/doc/libs/1_67_0/libs/locale/doc/html/boundary_8cpp-example.html
//
// Copyright (c) 2009-2011 Artyom Beilis (Tonkikh)
//
// Distributed under the Boost Software License, Version 1.0. (See
// accompanying file LICENSE_1_0.txt or copy at
// http://www.boost.org/LICENSE_1_0.txt)
//
#include <boost/locale.hpp>
#include <cassert>
#include <ctime>
#include <iostream>
int main() {
using namespace boost::locale;
using namespace std;
generator gen;
// Make system default locale global
std::locale loc = gen("");
locale::global(loc);
cout.imbue(loc);
string text = "Hello World! あにま! Linux2.6 and Windows7 is word and "
"number. שָלוֹם עוֹלָם!";
cout << text << endl;
boundary::ssegment_index index(boundary::word, text.begin(), text.end());
boundary::ssegment_index::iterator p, e;
for (p = index.begin(), e = index.end(); p != e; ++p) {
cout << "Part [" << *p << "] has ";
if (p->rule() & boundary::word_number)
cout << "number(s) ";
if (p->rule() & boundary::word_letter)
cout << "letter(s) ";
if (p->rule() & boundary::word_kana)
cout << "kana character(s) ";
if (p->rule() & boundary::word_ideo)
cout << "ideographic character(s) ";
if (p->rule() & boundary::word_none)
cout << "no word characters";
cout << endl;
}
index.map(boundary::character, text.begin(), text.end());
for (p = index.begin(), e = index.end(); p != e; ++p) {
cout << "|" << *p;
}
cout << "|\n\n";
index.map(boundary::line, text.begin(), text.end());
for (p = index.begin(), e = index.end(); p != e; ++p) {
cout << "|" << *p;
}
cout << "|\n\n";
index.map(boundary::sentence, text.begin(), text.end());
for (p = index.begin(), e = index.end(); p != e; ++p) {
cout << "|" << *p;
}
cout << "|\n\n";
}
|