1 /*
2  * Copyright 2017 Google Inc.
3  *
4  * Use of this source code is governed by a BSD-style license that can be
5  * found in the LICENSE file.
6  */
7 
8 #ifndef SKSL_NFASTATE
9 #define SKSL_NFASTATE
10 
11 #include <string>
12 #include <vector>
13 
14 #include "LexUtil.h"
15 
16 struct NFAState {
17     enum Kind {
18         // represents an accept state - if the NFA ends up in this state, we have successfully
19         // matched the token indicated by fData[0]
20         kAccept_Kind,
21         // matches the single character fChar
22         kChar_Kind,
23         // the regex '.'; matches any char but '\n'
24         kDot_Kind,
25         // a state which serves as a placeholder for the states indicated in fData. When we
26         // transition to this state, we instead transition to all of the fData states.
27         kRemapped_Kind,
28         // contains a list of true/false values in fData. fData[c] tells us whether we accept the
29         // character c.
30         kTable_Kind
31     };
32 
33     NFAState(Kind kind, std::vector<int> next)
34     : fKind(kind)
35     , fNext(std::move(next)) {}
36 
37     NFAState(char c, std::vector<int> next)
38     : fKind(kChar_Kind)
39     , fChar(c)
40     , fNext(std::move(next)) {}
41 
42     NFAState(std::vector<int> states)
43     : fKind(kRemapped_Kind)
44     , fData(std::move(states)) {}
45 
46     NFAState(bool inverse, std::vector<bool> accepts, std::vector<int> next)
47     : fKind(kTable_Kind)
48     , fInverse(inverse)
49     , fNext(std::move(next)) {
50         for (bool b : accepts) {
51             fData.push_back(b);
52         }
53     }
54 
55     NFAState(int token)
56     : fKind(kAccept_Kind) {
57         fData.push_back(token);
58     }
59 
60     bool accept(char c) const {
61         switch (fKind) {
62             case kAccept_Kind:
63                 return false;
64             case kChar_Kind:
65                 return c == fChar;
66             case kDot_Kind:
67                 return c != '\n';
68             case kTable_Kind: {
69                 bool value;
70                 if ((size_t) c < fData.size()) {
71                     value = fData[c];
72                 } else {
73                     value = false;
74                 }
75                 return value != fInverse;
76             }
77             default:
78                 ABORT("unreachable");
79         }
80     }
81 
82     std::string description() const {
83         switch (fKind) {
84             case kAccept_Kind:
85                 return "Accept(" + std::to_string(fData[0]) + ")";
86             case kChar_Kind: {
87                 std::string result = "Char('" + std::string(1, fChar) + "'";
88                 for (int v : fNext) {
89                     result += ", ";
90                     result += std::to_string(v);
91                 }
92                 result += ")";
93                 return result;
94             }
95             case kDot_Kind: {
96                 std::string result = "Dot(";
97                 const char* separator = "";
98                 for (int v : fNext) {
99                     result += separator;
100                     result += std::to_string(v);
101                     separator = ", ";
102                 }
103                 result += ")";
104                 return result;
105             }
106             case kRemapped_Kind: {
107                 std::string result = "Remapped(";
108                 const char* separator = "";
109                 for (int v : fData) {
110                     result += separator;
111                     result += std::to_string(v);
112                     separator = ", ";
113                 }
114                 result += ")";
115                 return result;
116             }
117             case kTable_Kind: {
118                 std::string result = std::string("Table(") + (fInverse ? "true" : "false") + ", [";
119                 const char* separator = "";
120                 for (int v : fData) {
121                     result += separator;
122                     result += v ? "true" : "false";
123                     separator = ", ";
124                 }
125                 result += "]";
126                 for (int n : fNext) {
127                     result += ", ";
128                     result += std::to_string(n);
129                 }
130                 result += ")";
131                 return result;
132             }
133             default:
134                 ABORT("unreachable");
135         }
136     }
137 
138     Kind fKind;
139 
140     char fChar = 0;
141 
142     bool fInverse = false;
143 
144     std::vector<int> fData;
145 
146     // states we transition to upon a succesful match from this state
147     std::vector<int> fNext;
148 };
149 
150 #endif
151