blob: 3b80fe3390e920b2894188c091c794f8638b2e50 (
plain) (
blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
|
// Copyright 2016 Yahoo Inc. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root.
/**
* @author Peter Boros
* @date 2004/08/20
* @version $Id$
* @file segmenter_test.cpp
* @brief Test for the Segmenter class
*
*/
#include <iostream>
#include <iomanip>
#include <vespa/fsa/segmenter.h>
using namespace fsa;
int main(int argc, char **argv)
{
FSA dict(argc>=2? argv[1] : "__testfsa__.__fsa__");
Segmenter segmenter(dict);
Segmenter::Segments segments;
const Segmenter::Segmentation *segmentation;
std::string text;
while(!std::cin.eof()){
getline(std::cin,text);
if(text.size()>3){
segmenter.segment(text,segments);
std::cout << "List of all segments:" << std::endl;
for(unsigned int i=0; i<segments.size(); i++){
std::cout << " "
<< segments.sgm(i) << ":" << segments.conn(i) << " ["
<< segments.beg(i) << "," << segments.end(i)-1 << "]"
<< std::endl;
}
segmentation=segments.segmentation(Segmenter::SEGMENTATION_WEIGHTED);
std::cout << "Weighted segmentation:" << std::endl << " ";
for(Segmenter::SegmentationConstIterator it=segmentation->begin();
it!=segmentation->end();++it){
std::cout << "(" << segments.sgm(*it) << ")";
}
std::cout << std::endl;
segmentation=segments.segmentation(Segmenter::SEGMENTATION_RIGHTMOST_LONGEST);
std::cout << "Rightmost-longest segmentation:" << std::endl << " ";
for(Segmenter::SegmentationConstIterator it=segmentation->begin();
it!=segmentation->end();++it){
std::cout << "(" << segments.sgm(*it) << ")";
}
std::cout << std::endl;
segmentation=segments.segmentation(Segmenter::SEGMENTATION_LEFTMOST_LONGEST);
std::cout << "Lefttmost-longest segmentation:" << std::endl << " ";
for(Segmenter::SegmentationConstIterator it=segmentation->begin();
it!=segmentation->end();++it){
std::cout << "(" << segments.sgm(*it) << ")";
}
std::cout << std::endl;
}
}
return 0;
}
|