-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathlexing.cpp
123 lines (117 loc) · 2.8 KB
/
lexing.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
#include "includes/lexing.h"
#include <ctype.h>
#include "includes/token.h"
#include <fstream>
#include <limits>
// Scanning cursor shared by all DFA* functions; each of them reads *tmp and
// advances it past the characters it consumes. Set by DFA() to the start of
// the input buffer.
char *tmp;
// One past the last character of the input buffer; set by DFA().
char *end_;
// Line number stamped into every emitted token. Starts at 1 and is
// incremented by DFA() each time it consumes a '\n'.
int currentLine = 1;
// Scans an identifier or reserved word starting at the global cursor `tmp`.
//
// Consumes the longest run of letters, digits and underscores, then appends a
// new token to `token::tokens`: its type is the value stored in `reservedMap`
// when the lexeme is a key there, otherwise `IDENFR`. The token carries the
// current value of `currentLine`. On return `tmp` points at the first
// character that is not part of the lexeme.
void DFAReserved()
{
    std::string lexeme;
    // The <ctype.h> classifiers have undefined behaviour for negative values,
    // so a plain char (which may be signed) is converted to unsigned char first.
    while (*tmp == '_' || isalnum(static_cast<unsigned char>(*tmp)))
    {
        lexeme += *tmp;
        ++tmp;
    }

    // One lookup serves both the membership test and the value fetch.
    const auto found = reservedMap.find(lexeme);
    if (found != reservedMap.end())
    {
        token::tokens.push_back(new token(lexeme, found->second, currentLine));
    }
    else
    {
        token::tokens.push_back(new token(lexeme, IDENFR, currentLine));
    }
}
// Scans one operator or punctuation token starting at the global cursor `tmp`.
//
// The two-character operators "&&", "||", "<=", ">=", "==" and "!=" are tried
// first; if one matches, its token is appended to `token::tokens` and `tmp`
// advances by two. Otherwise a one-character token is appended whose type is
// looked up with `charMap[*tmp]`, and `tmp` advances by one.
// NOTE(review): nothing here checks that the character is a known symbol —
// confirm how `charMap` behaves for characters it does not contain.
void DFASymbols()
{
    const char lead = *tmp;
    // The following character is only inspected when it lies inside the
    // buffer; '\0' stands in otherwise and matches none of the operators.
    const char follow = (tmp + 1 < end_) ? *(tmp + 1) : '\0';

    switch (lead)
    {
    case '&':
        if (follow == '&')
        {
            token::tokens.push_back(new token("&&", AND, currentLine));
            tmp += 2;
            return;
        }
        break;
    case '|':
        if (follow == '|')
        {
            token::tokens.push_back(new token("||", OR, currentLine));
            tmp += 2;
            return;
        }
        break;
    case '<':
        if (follow == '=')
        {
            token::tokens.push_back(new token("<=", LEQ, currentLine));
            tmp += 2;
            return;
        }
        break;
    case '>':
        if (follow == '=')
        {
            token::tokens.push_back(new token(">=", GEQ, currentLine));
            tmp += 2;
            return;
        }
        break;
    case '=':
        if (follow == '=')
        {
            token::tokens.push_back(new token("==", EQL, currentLine));
            tmp += 2;
            return;
        }
        break;
    case '!':
        if (follow == '=')
        {
            token::tokens.push_back(new token("!=", NEQ, currentLine));
            tmp += 2;
            return;
        }
        break;
    default:
        break;
    }

    // No two-character operator matched: emit the single character.
    std::string single(1, lead);
    token::tokens.push_back(new token(single, charMap[*tmp], currentLine));
    ++tmp;
}
void DFAFormatString()
{
string tmpstr = "";
tmpstr += "\"";
tmp++;
while (*tmp != '"')
{
tmpstr += *tmp;
tmp++;
}
tmpstr += *tmp;
tmp++;
token::tokens.push_back(new token(tmpstr, STRCON, currentLine));
}
// Scans a decimal integer constant starting at the global cursor `tmp`.
//
// The first character is consumed unconditionally (the caller is expected to
// have checked that it is a digit), followed by every subsequent digit. An
// INTCON token is appended to `token::tokens` whose text is the decimal
// rendering of the parsed value, stamped with `currentLine`.
//
// Values that do not fit in an int saturate at the largest int instead of
// overflowing, which would be undefined behaviour for a signed type.
void DFAIntConst()
{
    const int maxValue = std::numeric_limits<int>::max();

    int value = *tmp - '0';
    ++tmp;

    // The <ctype.h> classifiers require a value representable as unsigned char.
    while (isdigit(static_cast<unsigned char>(*tmp)))
    {
        const int digit = *tmp - '0';
        // value * 10 + digit fits in an int exactly when value <= (maxValue - digit) / 10.
        if (value > (maxValue - digit) / 10)
            value = maxValue;
        else
            value = value * 10 + digit;
        ++tmp;
    }

    // Original author's note (translated): "why wasn't `new` used here?"
    token::tokens.push_back(new token(std::to_string(value), INTCON, currentLine));
}
void DFA(std::string raw)
{
int len = raw.length();
tmp = &(raw[0]);
end_ = &(raw[0]) + len;
while (tmp - &raw[0] < len)
{
if (*tmp == ' ' || *tmp == '\t')
tmp++;
else if (*tmp == '\n')
{
tmp++;
currentLine++;
}
else if (isdigit(*tmp))
DFAIntConst();
else if (isalpha(*tmp) || *tmp == '_')
DFAReserved();
else if (*tmp == '"')
DFAFormatString();
else
DFASymbols();
}
}