1 | // |
2 | // Copyright (C) 2002-2005 3Dlabs Inc. Ltd. |
3 | // Copyright (C) 2013 LunarG, Inc. |
4 | // |
5 | // All rights reserved. |
6 | // |
7 | // Redistribution and use in source and binary forms, with or without |
8 | // modification, are permitted provided that the following conditions |
9 | // are met: |
10 | // |
11 | // Redistributions of source code must retain the above copyright |
12 | // notice, this list of conditions and the following disclaimer. |
13 | // |
14 | // Redistributions in binary form must reproduce the above |
15 | // copyright notice, this list of conditions and the following |
16 | // disclaimer in the documentation and/or other materials provided |
17 | // with the distribution. |
18 | // |
19 | // Neither the name of 3Dlabs Inc. Ltd. nor the names of its |
20 | // contributors may be used to endorse or promote products derived |
21 | // from this software without specific prior written permission. |
22 | // |
23 | // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS |
24 | // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT |
25 | // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS |
26 | // FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE |
27 | // COPYRIGHT HOLDERS OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, |
28 | // INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, |
29 | // BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; |
30 | // LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER |
31 | // CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT |
32 | // LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN |
33 | // ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE |
34 | // POSSIBILITY OF SUCH DAMAGE. |
35 | // |
36 | #ifndef _GLSLANG_SCAN_INCLUDED_ |
37 | #define _GLSLANG_SCAN_INCLUDED_ |
38 | |
39 | #include "Versions.h" |
40 | |
41 | namespace glslang { |
42 | |
// One end-of-input marker is shared by every layer that passes characters
// along, so no layer has to translate it. Real characters are handled as
// positive 8-bit values (0..255), so none of them - not even character 255 -
// can be mistaken for this negative marker.
constexpr int EndOfInput = -1;
47 | |
48 | // |
49 | // A character scanner that seamlessly, on read-only strings, reads across an |
50 | // array of strings without assuming null termination. |
51 | // |
52 | class TInputScanner { |
53 | public: |
54 | TInputScanner(int n, const char* const s[], size_t L[], const char* const* names = nullptr, |
55 | int b = 0, int f = 0, bool single = false) : |
56 | numSources(n), |
57 | // up to this point, common usage is "char*", but now we need positive 8-bit characters |
58 | sources(reinterpret_cast<const unsigned char* const *>(s)), |
59 | lengths(L), currentSource(0), currentChar(0), stringBias(b), finale(f), singleLogical(single), |
60 | endOfFileReached(false) |
61 | { |
62 | loc = new TSourceLoc[numSources]; |
63 | for (int i = 0; i < numSources; ++i) { |
64 | loc[i].init(i - stringBias); |
65 | } |
66 | if (names != nullptr) { |
67 | for (int i = 0; i < numSources; ++i) |
68 | loc[i].name = names[i] != nullptr ? NewPoolTString(names[i]) : nullptr; |
69 | } |
70 | loc[currentSource].line = 1; |
71 | logicalSourceLoc.init(1); |
72 | logicalSourceLoc.name = loc[0].name; |
73 | } |
74 | |
75 | virtual ~TInputScanner() |
76 | { |
77 | delete [] loc; |
78 | } |
79 | |
80 | // retrieve the next character and advance one character |
81 | int get() |
82 | { |
83 | int ret = peek(); |
84 | if (ret == EndOfInput) |
85 | return ret; |
86 | ++loc[currentSource].column; |
87 | ++logicalSourceLoc.column; |
88 | if (ret == '\n') { |
89 | ++loc[currentSource].line; |
90 | ++logicalSourceLoc.line; |
91 | logicalSourceLoc.column = 0; |
92 | loc[currentSource].column = 0; |
93 | } |
94 | advance(); |
95 | |
96 | return ret; |
97 | } |
98 | |
99 | // retrieve the next character, no advance |
100 | int peek() |
101 | { |
102 | if (currentSource >= numSources) { |
103 | endOfFileReached = true; |
104 | return EndOfInput; |
105 | } |
106 | // Make sure we do not read off the end of a string. |
107 | // N.B. Sources can have a length of 0. |
108 | int sourceToRead = currentSource; |
109 | size_t charToRead = currentChar; |
110 | while(charToRead >= lengths[sourceToRead]) { |
111 | charToRead = 0; |
112 | sourceToRead += 1; |
113 | if (sourceToRead >= numSources) { |
114 | return EndOfInput; |
115 | } |
116 | } |
117 | |
118 | // Here, we care about making negative valued characters positive |
119 | return sources[sourceToRead][charToRead]; |
120 | } |
121 | |
122 | // go back one character |
123 | void unget() |
124 | { |
125 | // Do not roll back once we've reached the end of the file. |
126 | if (endOfFileReached) |
127 | return; |
128 | |
129 | if (currentChar > 0) { |
130 | --currentChar; |
131 | --loc[currentSource].column; |
132 | --logicalSourceLoc.column; |
133 | if (loc[currentSource].column < 0) { |
134 | // We've moved back past a new line. Find the |
135 | // previous newline (or start of the file) to compute |
136 | // the column count on the now current line. |
137 | size_t chIndex = currentChar; |
138 | while (chIndex > 0) { |
139 | if (sources[currentSource][chIndex] == '\n') { |
140 | break; |
141 | } |
142 | --chIndex; |
143 | } |
144 | logicalSourceLoc.column = (int)(currentChar - chIndex); |
145 | loc[currentSource].column = (int)(currentChar - chIndex); |
146 | } |
147 | } else { |
148 | do { |
149 | --currentSource; |
150 | } while (currentSource > 0 && lengths[currentSource] == 0); |
151 | if (lengths[currentSource] == 0) { |
152 | // set to 0 if we've backed up to the start of an empty string |
153 | currentChar = 0; |
154 | } else |
155 | currentChar = lengths[currentSource] - 1; |
156 | } |
157 | if (peek() == '\n') { |
158 | --loc[currentSource].line; |
159 | --logicalSourceLoc.line; |
160 | } |
161 | } |
162 | |
163 | // for #line override |
164 | void setLine(int newLine) |
165 | { |
166 | logicalSourceLoc.line = newLine; |
167 | loc[getLastValidSourceIndex()].line = newLine; |
168 | } |
169 | |
170 | // for #line override in filename based parsing |
171 | void setFile(const char* filename) |
172 | { |
173 | TString* fn_tstr = NewPoolTString(filename); |
174 | logicalSourceLoc.name = fn_tstr; |
175 | loc[getLastValidSourceIndex()].name = fn_tstr; |
176 | } |
177 | |
178 | void setFile(const char* filename, int i) |
179 | { |
180 | TString* fn_tstr = NewPoolTString(filename); |
181 | if (i == getLastValidSourceIndex()) { |
182 | logicalSourceLoc.name = fn_tstr; |
183 | } |
184 | loc[i].name = fn_tstr; |
185 | } |
186 | |
187 | void setString(int newString) |
188 | { |
189 | logicalSourceLoc.string = newString; |
190 | loc[getLastValidSourceIndex()].string = newString; |
191 | logicalSourceLoc.name = nullptr; |
192 | loc[getLastValidSourceIndex()].name = nullptr; |
193 | } |
194 | |
195 | // for #include content indentation |
196 | void setColumn(int col) |
197 | { |
198 | logicalSourceLoc.column = col; |
199 | loc[getLastValidSourceIndex()].column = col; |
200 | } |
201 | |
202 | void setEndOfInput() |
203 | { |
204 | endOfFileReached = true; |
205 | currentSource = numSources; |
206 | } |
207 | |
208 | bool atEndOfInput() const { return endOfFileReached; } |
209 | |
210 | const TSourceLoc& getSourceLoc() const |
211 | { |
212 | if (singleLogical) { |
213 | return logicalSourceLoc; |
214 | } else { |
215 | return loc[std::max(0, std::min(currentSource, numSources - finale - 1))]; |
216 | } |
217 | } |
218 | // Returns the index (starting from 0) of the most recent valid source string we are reading from. |
219 | int getLastValidSourceIndex() const { return std::min(currentSource, numSources - 1); } |
220 | |
221 | void consumeWhiteSpace(bool& foundNonSpaceTab); |
222 | bool (); |
223 | void (bool& foundNonSpaceTab); |
224 | bool scanVersion(int& version, EProfile& profile, bool& notFirstToken); |
225 | |
226 | protected: |
227 | |
228 | // advance one character |
229 | void advance() |
230 | { |
231 | ++currentChar; |
232 | if (currentChar >= lengths[currentSource]) { |
233 | ++currentSource; |
234 | if (currentSource < numSources) { |
235 | loc[currentSource].string = loc[currentSource - 1].string + 1; |
236 | loc[currentSource].line = 1; |
237 | loc[currentSource].column = 0; |
238 | } |
239 | while (currentSource < numSources && lengths[currentSource] == 0) { |
240 | ++currentSource; |
241 | if (currentSource < numSources) { |
242 | loc[currentSource].string = loc[currentSource - 1].string + 1; |
243 | loc[currentSource].line = 1; |
244 | loc[currentSource].column = 0; |
245 | } |
246 | } |
247 | currentChar = 0; |
248 | } |
249 | } |
250 | |
251 | int numSources; // number of strings in source |
252 | const unsigned char* const *sources; // array of strings; must be converted to positive values on use, to avoid aliasing with -1 as EndOfInput |
253 | const size_t *lengths; // length of each string |
254 | int currentSource; |
255 | size_t currentChar; |
256 | |
257 | // This is for reporting what string/line an error occurred on, and can be overridden by #line. |
258 | // It remembers the last state of each source string as it is left for the next one, so unget() |
259 | // can restore that state. |
260 | TSourceLoc* loc; // an array |
261 | |
262 | int stringBias; // the first string that is the user's string number 0 |
263 | int finale; // number of internal strings after user's last string |
264 | |
265 | TSourceLoc logicalSourceLoc; |
266 | bool singleLogical; // treats the strings as a single logical string. |
267 | // locations will be reported from the first string. |
268 | |
269 | // Set to true once peek() returns EndOfFile, so that we won't roll back |
270 | // once we've reached EndOfFile. |
271 | bool endOfFileReached; |
272 | }; |
273 | |
274 | } // end namespace glslang |
275 | |
276 | #endif // _GLSLANG_SCAN_INCLUDED_ |
277 | |