-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathParser.cpp
85 lines (72 loc) · 1.59 KB
/
Parser.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
#include "Parser.h"
#include <iostream>
#include <sstream>
#include <stdexcept>
using namespace std;
// Returns a reference to the word at flat position `begin`, where positions
// are counted across all entries of `patterns` in order (the words of
// patterns[0] first, then those of patterns[1], and so on).
//
// begin: zero-based flat index over the concatenation of all patterns.
// Throws std::out_of_range when `begin` is negative or not smaller than the
// total number of stored words; previously control fell off the end of the
// function in that case, which is undefined behaviour.
string& BaseParser::getWord(int begin)
{
	if (begin >= 0)
	{
		// Work in size_t so the comparison against size() is not mixed-sign.
		size_t offset = static_cast<size_t>(begin);
		for (size_t i = 0; i < patterns.size(); ++i)
		{
			if (offset < patterns[i].size())
				return patterns[i][offset];
			// Skip this pattern: make the offset relative to the next one.
			offset -= patterns[i].size();
		}
	}
	throw std::out_of_range("BaseParser::getWord: index out of range");
}
// Returns the index (into `patterns`) of the pattern that contains flat
// position `begin`, where positions are counted across all entries of
// `patterns` in order.
//
// begin: zero-based flat index over the concatenation of all patterns.
// Throws std::out_of_range when `begin` is negative or not smaller than the
// total number of stored words; previously the function ended without a
// return statement in that case, which is undefined behaviour.
int BaseParser::getNumber(int begin)
{
	if (begin >= 0)
	{
		// Work in size_t so the comparison against size() is not mixed-sign.
		size_t offset = static_cast<size_t>(begin);
		for (size_t i = 0; i < patterns.size(); ++i)
		{
			if (offset < patterns[i].size())
				return static_cast<int>(i);
			// Skip this pattern: make the offset relative to the next one.
			offset -= patterns[i].size();
		}
	}
	throw std::out_of_range("BaseParser::getNumber: index out of range");
}
// Returns the length in bytes (1-4) of the UTF-8 sequence introduced by the
// lead byte `byte`, determined from its high-order bits:
//   0xxxxxxx -> 1, 110xxxxx -> 2, 1110xxxx -> 3, 11110xxx -> 4.
//
// Bytes that are not valid lead bytes (continuation bytes 10xxxxxx and
// 0xF8-0xFF) yield 1 so that a caller consumes exactly that byte and keeps
// making progress. Previously no value was returned for them, which is
// undefined behaviour.
int BoundaryParser::utf8Size(uint8_t byte)
{
	if ( ( byte & 0x80 ) == 0 )
		return 1;
	if ( ( byte & 0xE0 ) == 0xC0 )
		return 2;
	if ( ( byte & 0xF0 ) == 0xE0 )
		return 3;
	if ( ( byte & 0xF8 ) == 0xF0 )
		return 4;
	// Malformed lead byte: treat it as a single-byte unit.
	return 1;
}
// Reads standard input by calling readFileCompletely() repeatedly for as
// long as cin is in a good state, passing an increasing counter that starts
// at 0.
//
// Note: cin only leaves the good state once a read has failed, so when the
// input ends with '\n' one further call is made; that call reads nothing and
// appends an empty entry to `patterns`.
void BoundaryParser::readInput()
{
	for (int index = 0; cin.good(); ++index)
		readFileCompletely(index);
}
// Reads one newline-terminated record from cin, splits it into UTF-8 code
// units (one string per character, sized by utf8Size() of its lead byte) and
// appends the resulting vector to `patterns`. `totalLength` is incremented
// once per stored character. The '\n' delimiter is consumed but not stored.
//
// number: not used by this function.
//
// Reading stops at '\n' or when the stream stops being good. A multi-byte
// sequence cut short by end of input is stored with only the bytes that were
// actually read; previously the EOF sentinel was appended as a 0xFF byte for
// every missing continuation byte.
void BoundaryParser::readFileCompletely(int number)
{
	vector<string> file;
	while ( true )
	{
		// Keep the result as int until the stream state has been checked, so
		// the EOF sentinel is never mistaken for data.
		const int lead = cin.get();
		if ( !cin.good() )
			break;
		//delimiter
		if ( lead == '\n' )
			break;

		string word(1, static_cast<char>(lead));
		const int size = utf8Size(static_cast<uint8_t>(lead));
		for (int i = 1; i < size; ++i)
		{
			const int next = cin.get();
			// Truncated sequence: keep what was read, drop the sentinel.
			if ( !cin.good() )
				break;
			word += static_cast<char>(next);
		}

		file.push_back(word);
		totalLength++;
	}
	patterns.push_back(file);
}