// SimString sample: builds a small database of person names and runs
// similarity queries against it.
#include <iostream>
#include <iterator>
#include <string>
#include <vector>

#include <simstring/simstring.h>
/**
 * Queries the database for strings similar to `query` and prints the
 * matches on a single line of standard output, separated by ", ".
 * The line is terminated (and flushed) even when nothing matches, so an
 * empty result shows up as an empty line.
 *
 * @param dbr        Reader to query; forwarded to dbr.retrieve().
 * @param query      Query string.
 * @param measure    Similarity measure identifier (callers pass values such
 *                   as simstring::cosine or simstring::overlap).
 * @param threshold  Similarity threshold forwarded to dbr.retrieve().
 */
void retrieve(
    simstring::reader& dbr,
    const std::string& query,
    int measure,
    double threshold
    )
{
    // Collect the similar strings into a vector.
    std::vector<std::string> matches;
    dbr.retrieve(query, measure, threshold, std::back_inserter(matches));

    // Walk the results with an iterator rather than an int index: this
    // avoids narrowing matches.size() to int and the signed/unsigned mix.
    const char *separator = "";
    for (std::vector<std::string>::const_iterator it = matches.begin();
         it != matches.end(); ++it) {
        std::cout << separator << *it;
        separator = ", ";   // every element after the first is prefixed
    }
    std::cout << std::endl;
}
/**
 * Builds a two-entry SimString database in "sample.db", reopens it for
 * reading, and prints the results of four sample queries.
 *
 * @return 0 on success; 1 if the database could not be written or opened.
 */
int main(int argc, char *argv[])
{
    // Command-line arguments are not used by this sample.
    static_cast<void>(argc);
    static_cast<void>(argv);

    // Create a SimString database with two person names.
    simstring::ngram_generator gen(3, false);
    simstring::writer_base<std::string> dbw(gen, "sample.db");
    if (dbw.fail()) {
        // The constructor opens the database; stop before inserting into
        // a writer that never opened.
        std::cerr << "ERROR: " << dbw.error() << std::endl;
        return 1;
    }
    dbw.insert("Barack Hussein Obama II");
    dbw.insert("James Gordon Brown");
    dbw.close();
    if (dbw.fail()) {
        // Covers errors raised while inserting or finalizing the database.
        std::cerr << "ERROR: " << dbw.error() << std::endl;
        return 1;
    }

    // Open the database for reading.
    simstring::reader dbr;
    if (!dbr.open("sample.db")) {
        std::cerr << "ERROR: " << dbr.error() << std::endl;
        return 1;
    }

    // Run the sample queries; each prints one line of matches.
    retrieve(dbr, "Barack Obama", simstring::cosine, 0.6);
    retrieve(dbr, "Gordon Brown", simstring::cosine, 0.6);
    retrieve(dbr, "Obama", simstring::cosine, 0.6);
    retrieve(dbr, "Obama", simstring::overlap, 1.0);
    return 0;
}
|