LexJAVA.cxx source code [DeepinIDE/3rdparty/unioncode-scintilla515/lexilla/lexers/LexJAVA.cxx]

1	// Scintilla source code edit control
2	/** @file LexJAVA.cxx
3	** Lexer for C++, C, Java, and JavaScript.
4	** Further folding features and configuration properties added by "Udo Lechner" <dlchnr(at)gmx(dot)net>
5	**/
6	// Copyright 1998-2005 by Neil Hodgson <neilh@scintilla.org>
7	// The License.txt file describes the conditions under which this software may be distributed.
8
9	#include <cstdlib>
10	#include <cassert>
11	#include <cstring>
12
13	#include <utility>
14	#include <string>
15	#include <string_view>
16	#include <vector>
17	#include <map>
18	#include <algorithm>
19	#include <iterator>
20	#include <functional>
21
22	#include "ILexer.h"
23	#include "Scintilla.h"
24	#include "SciLexer.h"
25
26	#include "StringCopy.h"
27	#include "WordList.h"
28	#include "LexAccessor.h"
29	#include "Accessor.h"
30	#include "StyleContext.h"
31	#include "CharacterSet.h"
32	#include "LexerModule.h"
33	#include "OptionSet.h"
34	#include "SparseState.h"
35	#include "SubStyles.h"
36
37	using namespace Scintilla;
38	using namespace Lexilla;
39
40	namespace {
41	// Use an unnamed namespace to protect the functions and classes from name conflicts
42
43	constexpr bool IsSpaceEquiv(int state) noexcept {
44	return (state <= SCE_JAVA_COMMENTDOC) \|\|
45	// including SCE_JAVA_DEFAULT, SCE_JAVA_COMMENT, SCE_JAVA_COMMENTLINE
46	(state == SCE_JAVA_COMMENTLINEDOC) \|\| (state == SCE_JAVA_COMMENTDOCKEYWORD) \|\|
47	(state == SCE_JAVA_COMMENTDOCKEYWORDERROR);
48	}
49
50	// Preconditions: sc.currentPos points to a character after '+' or '-'.
51	// The test for pos reaching 0 should be redundant,
52	// and is in only for safety measures.
53	// Limitation: this code will give the incorrect answer for code like
54	// a = b+++/ptn/...
55	// Putting a space between the '++' post-inc operator and the '+' binary op
56	// fixes this, and is highly recommended for readability anyway.
57	bool FollowsPostfixOperator(const StyleContext &sc, LexAccessor &styler) {
58	Sci_Position pos = sc.currentPos;
59	while (--pos > `0`) {
60	const char ch = styler [pos];
61	if (ch == `'+'` \|\| ch == `'-'`) {
62	return styler [pos - `1`] == ch;
63	}
64	}
65	return false;
66	}
67
68	bool followsReturnKeyword(const StyleContext &sc, LexAccessor &styler) {
69	// Don't look at styles, so no need to flush.
70	Sci_Position pos = sc.currentPos;
71	const Sci_Position currentLine = styler.GetLine(pos);
72	const Sci_Position lineStartPos = styler.LineStart(currentLine);
73	while (--pos > lineStartPos) {
74	const char ch = styler.SafeGetCharAt(pos);
75	if (ch != `' '` && ch != `'\t'`) {
76	break;
77	}
78	}
79	const char *retBack = "nruter";
80	const char *s = retBack;
81	while (*s
82	&& pos >= lineStartPos
83	&& styler.SafeGetCharAt(pos) == *s) {
84	s++;
85	pos--;
86	}
87	return !*s;
88	}
89
// True when ch is a space or a horizontal tab; line ends and other white space do not count.
constexpr bool IsSpaceOrTab(int ch) noexcept {
	return ch == ' ' || ch == '\t';
}
93
// True when s consists solely of spaces and tabs; an empty string also qualifies.
bool OnlySpaceOrTab(const std::string &s) noexcept {
	return s.find_first_not_of(" \t") == std::string::npos;
}
101
// Split text at every occurrence of separator.
// Returns one element per field, so "a,,b" yields {"a", "", "b"} and a trailing
// separator yields a trailing empty field. Empty text yields an empty vector.
std::vector<std::string> StringSplit(const std::string &text, int separator) {
	// Start with one (empty) field unless there is nothing to split at all.
	std::vector<std::string> vs(text.empty() ? 0 : 1);
	for (const char ch : text) {
		if (ch == separator) {
			vs.emplace_back();
		} else {
			vs.back() += ch;
		}
	}
	return vs;
}
113
// Positions of a matching "(" ... ")" pair inside a token vector.
// Both iterators equal the vector's end() when no complete pair exists.
struct BracketPair {
	std::vector<std::string>::iterator itBracket;
	std::vector<std::string>::iterator itEndBracket;
};

// Locate the first "(" token in tokens and the ")" token that closes it,
// taking nested brackets into account.
// Returns {end, end} when there is no "(" or when it is never closed.
BracketPair FindBracketPair(std::vector<std::string> &tokens) {
	const auto itEnd = tokens.end();
	BracketPair bp{itEnd, itEnd};
	const auto itOpen = std::find(tokens.begin(), itEnd, "(");
	// The scan starts on the opening bracket itself, so nest is at least 1
	// before any ")" is seen and can not wrap below zero.
	size_t nest = 0;
	for (auto itTok = itOpen; itTok != itEnd; ++itTok) {
		if (*itTok == "(") {
			nest++;
		} else if (*itTok == ")") {
			nest--;
			if (nest == 0) {
				bp.itBracket = itOpen;
				bp.itEndBracket = itTok;
				return bp;
			}
		}
	}
	return bp;
}
143
144	void highlightTaskMarker(StyleContext &sc, LexAccessor &styler,
145	int activity, const WordList &markerList, bool caseSensitive){
146	if ((isoperator(sc.chPrev) \|\| IsASpace(sc.chPrev)) && markerList.Length()) {
147	constexpr Sci_PositionU lengthMarker = `50`;
148	char marker[lengthMarker+`1`] = "";
149	const Sci_PositionU currPos = sc.currentPos;
150	Sci_PositionU i = `0`;
151	while (i < lengthMarker) {
152	const char ch = styler.SafeGetCharAt(currPos + i);
153	if (IsASpace(ch) \|\| isoperator(ch)) {
154	break;
155	}
156	if (caseSensitive)
157	marker[i] = ch;
158	else
159	marker[i] = MakeLowerCase(ch);
160	i++;
161	}
162	marker[i] = `'\0'`;
163	if (markerList.InList(marker)) {
164	sc.SetState(SCE_JAVA_TASKMARKER\|activity);
165	}
166	}
167	}
168
169	class EscapeSequence {
170	const CharacterSet setHexDigits = CharacterSet (CharacterSet::setDigits, "ABCDEFabcdef");
171	const CharacterSet setOctDigits = CharacterSet (CharacterSet::setNone, "01234567");
172	const CharacterSet setNoneNumeric;
173	const CharacterSet escapeSetValid = nullptr*;
174	int digitsLeft = `0`;
175	public:
176	EscapeSequence() = default;
177	void resetEscapeState(int nextChar) {
178	digitsLeft = `0`;
179	escapeSetValid = &setNoneNumeric;
180	if (nextChar == `'U'`) {
181	digitsLeft = `9`;
182	escapeSetValid = &setHexDigits;
183	} else if (nextChar == `'u'`) {
184	digitsLeft = `5`;
185	escapeSetValid = &setHexDigits;
186	} else if (nextChar == `'x'`) {
187	digitsLeft = `5`;
188	escapeSetValid = &setHexDigits;
189	} else if (setOctDigits.Contains(nextChar)) {
190	digitsLeft = `3`;
191	escapeSetValid = &setOctDigits;
192	}
193	}
194	bool atEscapeEnd(int currChar) const {
195	return (digitsLeft <= `0`) \|\| !escapeSetValid->Contains(currChar);
196	}
197	void consumeDigit() noexcept {
198	digitsLeft--;
199	}
200	};
201
202	std::string GetRestOfLine(LexAccessor &styler, Sci_Position start, bool allowSpace) {
203	std::string restOfLine;
204	Sci_Position line = styler.GetLine(start);
205	Sci_Position pos = start;
206	Sci_Position endLine = styler.LineEnd(line);
207	char ch = styler.SafeGetCharAt(start, `'\n'`);
208	while (pos < endLine) {
209	if (ch == `'\\'` && ((pos + `1`) == endLine)) {
210	// Continuation line
211	line++;
212	pos = styler.LineStart(line);
213	endLine = styler.LineEnd(line);
214	ch = styler.SafeGetCharAt(pos, `'\n'`);
215	} else {
216	const char chNext = styler.SafeGetCharAt(pos + `1`, `'\n'`);
217	if (ch == `'/'` && (chNext == `'/'` \|\| chNext == `'*'`))
218	break;
219	if (allowSpace \|\| (ch != `' '`)) {
220	restOfLine += ch;
221	}
222	pos++;
223	ch = chNext;
224	}
225	}
226	return restOfLine;
227	}
228
229	constexpr bool IsStreamCommentStyle(int style) noexcept {
230	return style == SCE_JAVA_COMMENT \|\|
231	style == SCE_JAVA_COMMENTDOC \|\|
232	style == SCE_JAVA_COMMENTDOCKEYWORD \|\|
233	style == SCE_JAVA_COMMENTDOCKEYWORDERROR;
234	}
235
236	struct PPDefinition {
237	Sci_Position line;
238	std::string key;
239	std::string value;
240	bool isUndef;
241	std::string arguments;
242	PPDefinition(Sci_Position line_, const std::string &key_, const std::string &value_, bool isUndef_ = false, const std::string &arguments_="") :
243	line(line_), key (key_), value (value_), isUndef(isUndef_), arguments (arguments_) {
244	}
245	};
246
// Bit OR-ed into a style number to select the inactive variant of that style.
constexpr int inactiveFlag = 0x40;

class LinePPState {
	// Track the state of preprocessor conditionals to allow showing active and inactive
	// code in different styles.
	// Only works up to 31 levels of conditional nesting.

	// state is a bit mask with 1 bit per level
	// bit is 1 for level if section inactive, so any bits set = inactive style
	int state = 0;
	// ifTaken is a bit mask with 1 bit per level
	// bit is 1 for level if some branch at this level has been taken
	int ifTaken = 0;
	// level is the nesting level of #if constructs
	int level = -1;
	static constexpr int maximumNestingLevel = 31;
	// Bit representing the current level in state / ifTaken.
	// Returns 1 when no section is open (level < 0), as callers expect.
	// Returns 0 for levels at or beyond maximumNestingLevel: no bit is tracked
	// for them and shifting that far would be undefined behaviour.
	int maskLevel() const noexcept {
		if (level < 0) {
			return 1;
		}
		if (level >= maximumNestingLevel) {
			return 0;
		}
		return 1 << level;
	}
public:
	LinePPState() noexcept {
	}
	// True when the current level is one that is tracked in the bit masks.
	bool ValidLevel() const noexcept {
		return level >= 0 && level < maximumNestingLevel;
	}
	// True when no enclosing tracked section is inactive.
	bool IsActive() const noexcept {
		return state == 0;
	}
	// True when at least one enclosing tracked section is inactive.
	bool IsInactive() const noexcept {
		return state != 0;
	}
	// Style modifier for the current state: inactiveFlag when inactive, otherwise 0.
	int ActiveState() const noexcept {
		return state ? inactiveFlag : 0;
	}
	// True when some branch at the current level has already been taken.
	bool CurrentIfTaken() const noexcept {
		return (ifTaken & maskLevel()) != 0;
	}
	// Enter a new conditional section; on says whether its first branch is active.
	// Levels beyond the tracked range are counted but not recorded.
	void StartSection(bool on) noexcept {
		level++;
		if (ValidLevel()) {
			if (on) {
				state &= ~maskLevel();
				ifTaken |= maskLevel();
			} else {
				state |= maskLevel();
				ifTaken &= ~maskLevel();
			}
		}
	}
	// Leave the current conditional section, clearing its bits.
	void EndSection() noexcept {
		if (ValidLevel()) {
			state &= ~maskLevel();
			ifTaken &= ~maskLevel();
		}
		level--;
	}
	// Flip the active/inactive bit of the current level and mark a branch as taken.
	void InvertCurrentLevel() noexcept {
		if (ValidLevel()) {
			state ^= maskLevel();
			ifTaken |= maskLevel();
		}
	}
};
314
315	// Hold the preprocessor state for each line seen.
316	// Currently one entry per line but could become sparse with just one entry per preprocessor line.
317	class PPStates {
318	std::vector<LinePPState> vlls;
319	public:
320	LinePPState ForLine(Sci_Position line) const noexcept {
321	if ((line > `0`) && (vlls.size() > static_cast<size_t>(line))) {
322	return vlls [line];
323	} else {
324	return LinePPState ();
325	}
326	}
327	void Add(Sci_Position line, LinePPState lls) {
328	vlls.resize(line+`1`);
329	vlls [line] = lls;
330	}
331	};
332
333	// An individual named option for use in an OptionSet
334
// Options used for LexerJAVA
// Each member is bound to a property name in OptionSetJAVA; the initialisers
// below are the values in effect until a property is set.
struct OptionsJAVA {
	bool stylingWithinPreprocessor = false;
	bool identifiersAllowDollars = true;
	bool trackPreprocessor = true;
	bool updatePreprocessor = true;
	bool verbatimStringsAllowEscapes = false;
	bool triplequotedStrings = false;
	bool hashquotedStrings = false;
	bool backQuotedStrings = false;
	bool escapeSequence = false;
	bool fold = false;
	bool foldSyntaxBased = true;
	bool foldComment = false;
	bool foldCommentMultiline = true;
	bool foldCommentExplicit = true;
	// Empty strings select the standard explicit fold markers.
	std::string foldExplicitStart;
	std::string foldExplicitEnd;
	bool foldExplicitAnywhere = false;
	bool foldPreprocessor = false;
	bool foldPreprocessorAtElse = false;
	bool foldCompact = false;
	bool foldAtElse = false;
};
382
// Descriptions of the word lists accepted by the lexer, in word list index
// order (index 0 first). The list is terminated by a null pointer.
const char *const javaWordLists[] = {
	"Primary keywords and identifiers",
	"Secondary keywords and identifiers",
	"Documentation comment keywords",
	"Global classes and typedefs",
	"Preprocessor definitions",
	"Task marker and error marker keywords",
	nullptr,
};
392
393	struct OptionSetJAVA : public OptionSet<OptionsJAVA> {
394	OptionSetJAVA() {
395	DefineProperty("styling.within.preprocessor", &OptionsJAVA::stylingWithinPreprocessor,
396	"For C++ code, determines whether all preprocessor code is styled in the "
397	"preprocessor style (0, the default) or only from the initial # to the end "
398	"of the command word(1).");
399
400	DefineProperty("lexer.java.allow.dollars", &OptionsJAVA::identifiersAllowDollars,
401	"Set to 0 to disallow the '$' character in identifiers with the java lexer.");
402
403	DefineProperty("lexer.java.track.preprocessor", &OptionsJAVA::trackPreprocessor,
404	"Set to 1 to interpret #if/#else/#endif to grey out code that is not active.");
405
406	DefineProperty("lexer.java.update.preprocessor", &OptionsJAVA::updatePreprocessor,
407	"Set to 1 to update preprocessor definitions when #define found.");
408
409	DefineProperty("lexer.java.verbatim.strings.allow.escapes", &OptionsJAVA::verbatimStringsAllowEscapes,
410	"Set to 1 to allow verbatim strings to contain escape sequences.");
411
412	DefineProperty("lexer.java.triplequoted.strings", &OptionsJAVA::triplequotedStrings,
413	"Set to 1 to enable highlighting of triple-quoted strings.");
414
415	DefineProperty("lexer.java.hashquoted.strings", &OptionsJAVA::hashquotedStrings,
416	"Set to 1 to enable highlighting of hash-quoted strings.");
417
418	DefineProperty("lexer.java.backquoted.strings", &OptionsJAVA::backQuotedStrings,
419	"Set to 1 to enable highlighting of back-quoted raw strings .");
420
421	DefineProperty("lexer.java.escape.sequence", &OptionsJAVA::escapeSequence,
422	"Set to 1 to enable highlighting of escape sequences in strings");
423
424	DefineProperty("fold", &OptionsJAVA::fold);
425
426	DefineProperty("fold.java.syntax.based", &OptionsJAVA::foldSyntaxBased,
427	"Set this property to 0 to disable syntax based folding.");
428
429	DefineProperty("fold.comment", &OptionsJAVA::foldComment,
430	"This option enables folding multi-line comments and explicit fold points when using the Java lexer. "
431	"Explicit fold points allows adding extra folding by placing a //{ comment at the start and a //} "
432	"at the end of a section that should fold.");
433
434	DefineProperty("fold.java.comment.multiline", &OptionsJAVA::foldCommentMultiline,
435	"Set this property to 0 to disable folding multi-line comments when fold.comment=1.");
436
437	DefineProperty("fold.java.comment.explicit", &OptionsJAVA::foldCommentExplicit,
438	"Set this property to 0 to disable folding explicit fold points when fold.comment=1.");
439
440	DefineProperty("fold.java.explicit.start", &OptionsJAVA::foldExplicitStart,
441	"The string to use for explicit fold start points, replacing the standard //{.");
442
443	DefineProperty("fold.java.explicit.end", &OptionsJAVA::foldExplicitEnd,
444	"The string to use for explicit fold end points, replacing the standard //}.");
445
446	DefineProperty("fold.java.explicit.anywhere", &OptionsJAVA::foldExplicitAnywhere,
447	"Set this property to 1 to enable explicit fold points anywhere, not just in line comments.");
448
449	DefineProperty("fold.java.preprocessor.at.else", &OptionsJAVA::foldPreprocessorAtElse,
450	"This option enables folding on a preprocessor #else or #endif line of an #if statement.");
451
452	DefineProperty("fold.preprocessor", &OptionsJAVA::foldPreprocessor,
453	"This option enables folding preprocessor directives when using the Java lexer. "
454	"Includes C#'s explicit #region and #endregion folding directives.");
455
456	DefineProperty("fold.compact", &OptionsJAVA::foldCompact);
457
458	DefineProperty("fold.at.else", &OptionsJAVA::foldAtElse,
459	"This option enables Java folding on a \"} else {\" line of an if statement.");
460
461	DefineWordListSets(javaWordLists);
462	}
463	};
464
465	const char styleSubable[] = {SCE_JAVA_IDENTIFIER, SCE_JAVA_COMMENTDOCKEYWORD, `0`};
466
467	LexicalClass lexicalClasses[] = {
468	// Lexer Java SCLEX_JAVA SCE_JAVA_:
469	`0`, "SCE_JAVA_DEFAULT", "default", "White space",
470	`1`, "SCE_JAVA_COMMENT", "comment", "Comment: /* */.",
471	`2`, "SCE_JAVA_COMMENTLINE", "comment line", "Line Comment: //.",
472	`3`, "SCE_JAVA_COMMENTDOC", "comment documentation", "Doc comment: block comments beginning with /** or /*!",
473	`4`, "SCE_JAVA_NUMBER", "literal numeric", "Number",
474	`5`, "SCE_JAVA_WORD", "keyword", "Keyword",
475	`6`, "SCE_JAVA_STRING", "literal string", "Double quoted string",
476	`7`, "SCE_JAVA_CHARACTER", "literal string character", "Single quoted string",
477	`8`, "SCE_JAVA_UUID", "literal uuid", "UUIDs (only in IDL)",
478	`9`, "SCE_JAVA_PREPROCESSOR", "preprocessor", "Preprocessor",
479	`10`, "SCE_JAVA_OPERATOR", "operator", "Operators",
480	`11`, "SCE_JAVA_IDENTIFIER", "identifier", "Identifiers",
481	`12`, "SCE_JAVA_STRINGEOL", "error literal string", "End of line where string is not closed",
482	`13`, "SCE_JAVA_VERBATIM", "literal string multiline raw", "Verbatim strings for C#",
483	`14`, "SCE_JAVA_REGEX", "literal regex", "Regular expressions for JavaScript",
484	`15`, "SCE_JAVA_COMMENTLINEDOC", "comment documentation line", "Doc Comment Line: line comments beginning with /// or //!.",
485	`16`, "SCE_JAVA_WORD2", "identifier", "Keywords2",
486	`17`, "SCE_JAVA_COMMENTDOCKEYWORD", "comment documentation keyword", "Comment keyword",
487	`18`, "SCE_JAVA_COMMENTDOCKEYWORDERROR", "error comment documentation keyword", "Comment keyword error",
488	`19`, "SCE_JAVA_GLOBALCLASS", "identifier", "Global class",
489	`20`, "SCE_JAVA_STRINGRAW", "literal string multiline raw", "Raw strings for C++0x",
490	`21`, "SCE_JAVA_TRIPLEVERBATIM", "literal string multiline raw", "Triple-quoted strings for Vala",
491	`22`, "SCE_JAVA_HASHQUOTEDSTRING", "literal string", "Hash-quoted strings for Pike",
492	`23`, "SCE_JAVA_PREPROCESSORCOMMENT", "comment preprocessor", "Preprocessor stream comment",
493	`24`, "SCE_JAVA_PREPROCESSORCOMMENTDOC", "comment preprocessor documentation", "Preprocessor stream doc comment",
494	`25`, "SCE_JAVA_USERLITERAL", "literal", "User defined literals",
495	`26`, "SCE_JAVA_TASKMARKER", "comment taskmarker", "Task Marker",
496	`27`, "SCE_JAVA_ESCAPESEQUENCE", "literal string escapesequence", "Escape sequence",
497	};
498
499	const int sizeLexicalClasses = static_cast<int>(std::size(lexicalClasses));
500
501	}
502
503	class LexerJAVA : public ILexer5 {
504	bool caseSensitive;
505	CharacterSet setWord;
506	CharacterSet setNegationOp;
507	CharacterSet setAddOp;
508	CharacterSet setMultOp;
509	CharacterSet setRelOp;
510	CharacterSet setLogicalOp;
511	CharacterSet setWordStart;
512	PPStates vlls;
513	std::vector<PPDefinition> ppDefineHistory;
514	WordList keywords;
515	WordList keywords2;
516	WordList keywords3;
517	WordList keywords4;
518	WordList ppDefinitions;
519	WordList markerList;
520	struct SymbolValue {
521	std::string value;
522	std::string arguments;
523	SymbolValue() noexcept = default;
524	SymbolValue(const std::string &value_, const std::string &arguments_) : value (value_), arguments (arguments_) {
525	}
526	SymbolValue &operator = (const std::string &value_) {
527	value = value_;
528	arguments.clear();
529	return *this;
530	}
531	bool IsMacro() const noexcept {
532	return !arguments.empty();
533	}
534	};
535	typedef std::map<std::string, SymbolValue> SymbolTable;
536	SymbolTable preprocessorDefinitionsStart;
537	OptionsJAVA options;
538	OptionSetJAVA osJava;
539	EscapeSequence escapeSeq;
540	SparseState<std::string> rawStringTerminators;
541	enum { ssIdentifier, ssDocKeyword };
542	SubStyles subStyles;
543	std::string returnBuffer;
544	public:
545	explicit LexerJAVA(bool caseSensitive_) :
546	caseSensitive(caseSensitive_),
547	setWord (CharacterSet::setAlphaNum, "._", true),
548	setNegationOp (CharacterSet::setNone, "!"),
549	setAddOp (CharacterSet::setNone, "+-"),
550	setMultOp (CharacterSet::setNone, "*/%"),
551	setRelOp (CharacterSet::setNone, "=!<>"),
552	setLogicalOp (CharacterSet::setNone, "\|&"),
553	subStyles (styleSubable, `0x80`, `0x40`, inactiveFlag) {
554	}
555	// Deleted so LexerJAVA objects can not be copied.
556	LexerJAVA(const LexerJAVA &) = delete;
557	LexerJAVA(LexerJAVA &&) = delete;
558	void operator=(const LexerJAVA &) = delete;
559	void operator=(LexerJAVA &&) = delete;
560	virtual ~LexerJAVA() {
561	}
562	void SCI_METHOD Release() noexcept override {
563	delete this;
564	}
565	int SCI_METHOD Version() const noexcept override {
566	return lvRelease5;
567	}
568	const char * SCI_METHOD PropertyNames() override {
569	return osJava.PropertyNames();
570	}
571	int SCI_METHOD PropertyType(const char *name) override {
572	return osJava.PropertyType(name);
573	}
574	const char * SCI_METHOD DescribeProperty(const char *name) override {
575	return osJava.DescribeProperty(name);
576	}
577	Sci_Position SCI_METHOD PropertySet(const char key, const* char *val) override;
578	const char * SCI_METHOD DescribeWordListSets() override {
579	return osJava.DescribeWordListSets();
580	}
581	Sci_Position SCI_METHOD WordListSet(int n, const char *wl) override;
582	void SCI_METHOD Lex(Sci_PositionU startPos, Sci_Position length, int initStyle, IDocument *pAccess) override;
583	void SCI_METHOD Fold(Sci_PositionU startPos, Sci_Position length, int initStyle, IDocument *pAccess) override;
584
585	void * SCI_METHOD PrivateCall(int, void ) noexcept* override {
586	return nullptr;
587	}
588
589	int SCI_METHOD LineEndTypesSupported() noexcept override {
590	return SC_LINE_END_TYPE_UNICODE;
591	}
592
593	int SCI_METHOD AllocateSubStyles(int styleBase, int numberStyles) override {
594	return subStyles.Allocate(styleBase, numberStyles);
595	}
596	int SCI_METHOD SubStylesStart(int styleBase) override {
597	return subStyles.Start(styleBase);
598	}
599	int SCI_METHOD SubStylesLength(int styleBase) override {
600	return subStyles.Length(styleBase);
601	}
602	int SCI_METHOD StyleFromSubStyle(int subStyle) override {
603	const int styleBase = subStyles.BaseStyle(MaskActive(subStyle));
604	const int inactive = subStyle & inactiveFlag;
605	return styleBase \| inactive;
606	}
607	int SCI_METHOD PrimaryStyleFromStyle(int style) noexcept override {
608	return MaskActive(style);
609	}
610	void SCI_METHOD FreeSubStyles() override {
611	subStyles.Free();
612	}
613	void SCI_METHOD SetIdentifiers(int style, const char *identifiers) override {
614	subStyles.SetIdentifiers(style, identifiers);
615	}
616	int SCI_METHOD DistanceToSecondaryStyles() noexcept override {
617	return inactiveFlag;
618	}
619	const char * SCI_METHOD GetSubStyleBases() noexcept override {
620	return styleSubable;
621	}
622	int SCI_METHOD NamedStyles() override {
623	return std::max(subStyles.LastAllocated() + `1`,
624	sizeLexicalClasses) +
625	inactiveFlag;
626	}
627	const char * SCI_METHOD NameOfStyle(int style) override {
628	if (style >= NamedStyles())
629	return "";
630	if (style < sizeLexicalClasses)
631	return lexicalClasses[style].name;
632	// TODO: inactive and substyles
633	return "";
634	}
635	const char * SCI_METHOD TagsOfStyle(int style) override {
636	if (style >= NamedStyles())
637	return "Excess";
638	returnBuffer.clear();
639	const int firstSubStyle = subStyles.FirstAllocated();
640	if (firstSubStyle >= `0`) {
641	const int lastSubStyle = subStyles.LastAllocated();
642	if (((style >= firstSubStyle) && (style <= (lastSubStyle))) \|\|
643	((style >= firstSubStyle + inactiveFlag) && (style <= (lastSubStyle + inactiveFlag)))) {
644	int styleActive = style;
645	if (style > lastSubStyle) {
646	returnBuffer = "inactive ";
647	styleActive -= inactiveFlag;
648	}
649	const int styleMain = StyleFromSubStyle(styleActive);
650	returnBuffer += lexicalClasses[styleMain].tags;
651	return returnBuffer.c_str();
652	}
653	}
654	if (style < sizeLexicalClasses)
655	return lexicalClasses[style].tags;
656	if (style >= inactiveFlag) {
657	returnBuffer = "inactive ";
658	const int styleActive = style - inactiveFlag;
659	if (styleActive < sizeLexicalClasses)
660	returnBuffer += lexicalClasses[styleActive].tags;
661	else
662	returnBuffer = "";
663	return returnBuffer.c_str();
664	}
665	return "";
666	}
667	const char * SCI_METHOD DescriptionOfStyle(int style) override {
668	if (style >= NamedStyles())
669	return "";
670	if (style < sizeLexicalClasses)
671	return lexicalClasses[style].description;
672	// TODO: inactive and substyles
673	return "";
674	}
675
676	// ILexer5 methods
677	const char * SCI_METHOD GetName() override {
678	return caseSensitive ? "java" : "javanocase";
679	}
680	int SCI_METHOD GetIdentifier() override {
681	return caseSensitive ? SCLEX_JAVA : SCLEX_JAVANOCASE;
682	}
683	const char * SCI_METHOD PropertyGet(const char *key) override;
684
685	static ILexer5 *LexerFactoryJAVA() {
686	return new LexerJAVA (true);
687	}
688	static ILexer5 *LexerFactoryJAVAInsensitive() {
689	return new LexerJAVA (false);
690	}
691	constexpr static int MaskActive(int style) noexcept {
692	return style & ~inactiveFlag;
693	}
694	void EvaluateTokens(std::vector<std::string> &tokens, const SymbolTable &preprocessorDefinitions);
695	std::vector<std::string> Tokenize(const std::string &expr) const;
696	bool EvaluateExpression(const std::string &expr, const SymbolTable &preprocessorDefinitions);
697	};
698
699	Sci_Position SCI_METHOD LexerJAVA::PropertySet(const char key, const* char *val) {
700	if (osJava.PropertySet(&options, key, val)) {
701	if (strcmp(key, "lexer.java.allow.dollars") == `0`) {
702	setWord = CharacterSet (CharacterSet::setAlphaNum, "._", true);
703	if (options.identifiersAllowDollars) {
704	setWord.Add(`'$'`);
705	}
706	}
707	return `0`;
708	}
709	return -`1`;
710	}
711
712	const char * SCI_METHOD LexerJAVA::PropertyGet(const char *key) {
713	return osJava.PropertyGet(key);
714	}
715
716	Sci_Position SCI_METHOD LexerJAVA::WordListSet(int n, const char *wl) {
717	WordList wordListN = nullptr*;
718	switch (n) {
719	case `0`:
720	wordListN = &keywords;
721	break;
722	case `1`:
723	wordListN = &keywords2;
724	break;
725	case `2`:
726	wordListN = &keywords3;
727	break;
728	case `3`:
729	wordListN = &keywords4;
730	break;
731	case `4`:
732	wordListN = &ppDefinitions;
733	break;
734	case `5`:
735	wordListN = &markerList;
736	break;
737	}
738	Sci_Position firstModification = -`1`;
739	if (wordListN) {
740	WordList wlNew;
741	wlNew.Set(wl);
742	if (*wordListN != wlNew) {
743	wordListN->Set(wl);
744	firstModification = `0`;
745	if (n == `4`) {
746	// Rebuild preprocessorDefinitions
747	preprocessorDefinitionsStart.clear();
748	for (int nDefinition = `0`; nDefinition < ppDefinitions.Length(); nDefinition++) {
749	const char *cpDefinition = ppDefinitions.WordAt(nDefinition);
750	const char *cpEquals = strchr(cpDefinition, `'='`);
751	if (cpEquals) {
752	std::string name(cpDefinition, cpEquals - cpDefinition);
753	std::string val(cpEquals+`1`);
754	const size_t bracket = name.find(`'('`);
755	const size_t bracketEnd = name.find(`')'`);
756	if ((bracket != std::string::npos) && (bracketEnd != std::string::npos)) {
757	// Macro
758	std::string args = name.substr(bracket + `1`, bracketEnd - bracket - `1`);
759	name = name.substr(`0`, bracket);
760	preprocessorDefinitionsStart [name] = SymbolValue (val, args);
761	} else {
762	preprocessorDefinitionsStart [name] = val;
763	}
764	} else {
765	std::string name(cpDefinition);
766	std::string val("1");
767	preprocessorDefinitionsStart [name] = val;
768	}
769	}
770	}
771	}
772	}
773	return firstModification;
774	}
775
776	void SCI_METHOD LexerJAVA::Lex(Sci_PositionU startPos, Sci_Position length, int initStyle, IDocument *pAccess) {
777	LexAccessor styler(pAccess);
778
779	CharacterSet setOKBeforeRE(CharacterSet::setNone, "([{=,:;!%^&*\|?~+-");
780	CharacterSet setCouldBePostOp(CharacterSet::setNone, "+-");
781
782	CharacterSet setDoxygen(CharacterSet::setAlpha, "$@\\&<>#{}[]");
783
784	setWordStart = CharacterSet (CharacterSet::setAlpha, "_", true);
785
786	CharacterSet setInvalidRawFirst(CharacterSet::setNone, " )\\\t\v\f\n");
787
788	if (options.identifiersAllowDollars) {
789	setWordStart.Add(`'$'`);
790	}
791
792	int chPrevNonWhite = `' '`;
793	int visibleChars = `0`;
794	bool lastWordWasUUID = false;
795	int styleBeforeDCKeyword = SCE_JAVA_DEFAULT;
796	int styleBeforeTaskMarker = SCE_JAVA_DEFAULT;
797	bool continuationLine = false;
798	bool isIncludePreprocessor = false;
799	bool isStringInPreprocessor = false;
800	bool inRERange = false;
801	bool seenDocKeyBrace = false;
802
803	Sci_Position lineCurrent = styler.GetLine(startPos);
804	if ((MaskActive(initStyle) == SCE_JAVA_PREPROCESSOR) \|\|
805	(MaskActive(initStyle) == SCE_JAVA_COMMENTLINE) \|\|
806	(MaskActive(initStyle) == SCE_JAVA_COMMENTLINEDOC)) {
807	// Set continuationLine if last character of previous line is '\'
808	if (lineCurrent > `0`) {
809	const Sci_Position endLinePrevious = styler.LineEnd(lineCurrent - `1`);
810	if (endLinePrevious > `0`) {
811	continuationLine = styler.SafeGetCharAt(endLinePrevious-`1`) == `'\\'`;
812	}
813	}
814	}
815
816	// look back to set chPrevNonWhite properly for better regex colouring
817	if (startPos > `0`) {
818	Sci_Position back = startPos;
819	while (--back && IsSpaceEquiv(MaskActive(styler.StyleAt(back))))
820	;
821	if (MaskActive(styler.StyleAt(back)) == SCE_JAVA_OPERATOR) {
822	chPrevNonWhite = styler.SafeGetCharAt(back);
823	}
824	}
825
826	StyleContext sc(startPos, length, initStyle, styler);
827	LinePPState preproc = vlls.ForLine(lineCurrent);
828
829	bool definitionsChanged = false;
830
831	// Truncate ppDefineHistory before current line
832
833	if (!options.updatePreprocessor)
834	ppDefineHistory.clear();
835
836	std::vector<PPDefinition>::iterator itInvalid = std::find_if(ppDefineHistory.begin(), ppDefineHistory.end(),
837	[lineCurrent](const PPDefinition &p) noexcept { return p.line >= lineCurrent; });
838	if (itInvalid != ppDefineHistory.end()) {
839	ppDefineHistory.erase(itInvalid, ppDefineHistory.end());
840	definitionsChanged = true;
841	}
842
843	SymbolTable preprocessorDefinitions = preprocessorDefinitionsStart;
844	for (const PPDefinition &ppDef : ppDefineHistory) {
845	if (ppDef.isUndef)
846	preprocessorDefinitions.erase(ppDef.key);
847	else
848	preprocessorDefinitions [ppDef.key] = SymbolValue (ppDef.value, ppDef.arguments);
849	}
850
851	std::string rawStringTerminator = rawStringTerminators.ValueAt(lineCurrent-`1`);
852	SparseState<std::string> rawSTNew(lineCurrent);
853
854	int activitySet = preproc.ActiveState();
855
856	const WordClassifier &classifierIdentifiers = subStyles.Classifier(SCE_JAVA_IDENTIFIER);
857	const WordClassifier &classifierDocKeyWords = subStyles.Classifier(SCE_JAVA_COMMENTDOCKEYWORD);
858
859	Sci_PositionU lineEndNext = styler.LineEnd(lineCurrent);
860
861	for (; sc.More();) {
862
863	if (sc.atLineStart) {
864	// Using MaskActive() is not needed in the following statement.
865	// Inside inactive preprocessor declaration, state will be reset anyway at the end of this block.
866	if ((sc.state == SCE_JAVA_STRING) \|\| (sc.state == SCE_JAVA_CHARACTER)) {
867	// Prevent SCE_JAVA_STRINGEOL from leaking back to previous line which
868	// ends with a line continuation by locking in the state up to this position.
869	sc.SetState(sc.state);
870	}
871	if ((MaskActive(sc.state) == SCE_JAVA_PREPROCESSOR) && (!continuationLine)) {
872	sc.SetState(SCE_JAVA_DEFAULT\|activitySet);
873	}
874	// Reset states to beginning of colourise so no surprises
875	// if different sets of lines lexed.
876	visibleChars = `0`;
877	lastWordWasUUID = false;
878	isIncludePreprocessor = false;
879	inRERange = false;
880	if (preproc.IsInactive()) {
881	activitySet = inactiveFlag;
882	sc.SetState(sc.state \| activitySet);
883	}
884	}
885
886	if (sc.atLineEnd) {
887	lineCurrent++;
888	lineEndNext = styler.LineEnd(lineCurrent);
889	vlls.Add(lineCurrent, preproc);
890	if (rawStringTerminator != "") {
891	rawSTNew.Set(lineCurrent-`1`, rawStringTerminator);
892	}
893	}
894
895	// Handle line continuation generically.
896	if (sc.ch == `'\\'`) {
897	if ((sc.currentPos+`1`) >= lineEndNext) {
898	lineCurrent++;
899	lineEndNext = styler.LineEnd(lineCurrent);
900	vlls.Add(lineCurrent, preproc);
901	if (rawStringTerminator != "") {
902	rawSTNew.Set(lineCurrent-`1`, rawStringTerminator);
903	}
904	sc.Forward();
905	if (sc.ch == `'\r'` && sc.chNext == `'\n'`) {
906	// Even in UTF-8, \r and \n are separate
907	sc.Forward();
908	}
909	continuationLine = true;
910	sc.Forward();
911	continue;
912	}
913	}
914
915	const bool atLineEndBeforeSwitch = sc.atLineEnd;
916
917	// Determine if the current state should terminate.
918	switch (MaskActive(sc.state)) {
919	case SCE_JAVA_OPERATOR:
920	sc.SetState(SCE_JAVA_DEFAULT\|activitySet);
921	break;
922	case SCE_JAVA_NUMBER:
923	// We accept almost anything because of hex. and number suffixes
924	if (sc.ch == `'_'`) {
925	sc.ChangeState(SCE_JAVA_USERLITERAL\|activitySet);
926	} else if (!(setWord.Contains(sc.ch)
927	\|\| (sc.ch == `'\''`)
928	\|\| ((sc.ch == `'+'` \|\| sc.ch == `'-'`) && (sc.chPrev == `'e'` \|\| sc.chPrev == `'E'` \|\|
929	sc.chPrev == `'p'` \|\| sc.chPrev == `'P'`)))) {
930	sc.SetState(SCE_JAVA_DEFAULT\|activitySet);
931	}
932	break;
933	case SCE_JAVA_USERLITERAL:
934	if (!(setWord.Contains(sc.ch)))
935	sc.SetState(SCE_JAVA_DEFAULT\|activitySet);
936	break;
937	case SCE_JAVA_IDENTIFIER:
938	if (sc.atLineStart \|\| sc.atLineEnd \|\| !setWord.Contains(sc.ch) \|\| (sc.ch == `'.'`)) {
939	char s[`1000`];
940	if (caseSensitive) {
941	sc.GetCurrent(s, sizeof(s));
942	} else {
943	sc.GetCurrentLowered(s, sizeof(s));
944	}
945	if (keywords.InList(s)) {
946	lastWordWasUUID = strcmp(s, "uuid") == `0`;
947	sc.ChangeState(SCE_JAVA_WORD\|activitySet);
948	} else if (keywords2.InList(s)) {
949	sc.ChangeState(SCE_JAVA_WORD2\|activitySet);
950	} else if (keywords4.InList(s)) {
951	sc.ChangeState(SCE_JAVA_GLOBALCLASS\|activitySet);
952	} else {
953	int subStyle = classifierIdentifiers.ValueFor(s);
954	if (subStyle >= `0`) {
955	sc.ChangeState(subStyle\|activitySet);
956	}
957	}
958	const bool literalString = sc.ch == `'\"'`;
959	if (literalString \|\| sc.ch == `'\''`) {
960	size_t lenS = strlen(s);
961	const bool raw = literalString && sc.chPrev == `'R'` && !setInvalidRawFirst.Contains(sc.chNext);
962	if (raw)
963	s[lenS--] = `'\0'`;
964	const bool valid =
965	(lenS == `0`) \|\|
966	((lenS == `1`) && ((s[`0`] == `'L'`) \|\| (s[`0`] == `'u'`) \|\| (s[`0`] == `'U'`))) \|\|
967	((lenS == `2`) && literalString && (s[`0`] == `'u'`) && (s[`1`] == `'8'`));
968	if (valid) {
969	if (literalString) {
970	if (raw) {
971	// Set the style of the string prefix to SCE_JAVA_STRINGRAW but then change to
972	// SCE_JAVA_DEFAULT as that allows the raw string start code to run.
973	sc.ChangeState(SCE_JAVA_STRINGRAW\|activitySet);
974	sc.SetState(SCE_JAVA_DEFAULT\|activitySet);
975	} else {
976	sc.ChangeState(SCE_JAVA_STRING\|activitySet);
977	}
978	} else {
979	sc.ChangeState(SCE_JAVA_CHARACTER\|activitySet);
980	}
981	} else {
982	sc.SetState(SCE_JAVA_DEFAULT \| activitySet);
983	}
984	} else {
985	sc.SetState(SCE_JAVA_DEFAULT\|activitySet);
986	}
987	}
988	break;
989	case SCE_JAVA_PREPROCESSOR:
990	if (options.stylingWithinPreprocessor) {
991	if (IsASpace(sc.ch) \|\| (sc.ch == `'('`)) {
992	sc.SetState(SCE_JAVA_DEFAULT\|activitySet);
993	}
994	} else if (isStringInPreprocessor && (sc.Match(`'>'`) \|\| sc.Match(`'\"'`) \|\| sc.atLineEnd)) {
995	isStringInPreprocessor = false;
996	} else if (!isStringInPreprocessor) {
997	if ((isIncludePreprocessor && sc.Match(`'<'`)) \|\| sc.Match(`'\"'`)) {
998	isStringInPreprocessor = true;
999	} else if (sc.Match(`'/'`, `'*'`)) {
1000	if (sc.Match("/*") \|\| sc.Match("/!")) {
1001	sc.SetState(SCE_JAVA_PREPROCESSORCOMMENTDOC\|activitySet);
1002	} else {
1003	sc.SetState(SCE_JAVA_PREPROCESSORCOMMENT\|activitySet);
1004	}
1005	sc.Forward(); // Eat the *
1006	} else if (sc.Match(`'/'`, `'/'`)) {
1007	sc.SetState(SCE_JAVA_DEFAULT\|activitySet);
1008	}
1009	}
1010	break;
1011	case SCE_JAVA_PREPROCESSORCOMMENT:
1012	case SCE_JAVA_PREPROCESSORCOMMENTDOC:
1013	if (sc.Match(`'*'`, `'/'`)) {
1014	sc.Forward();
1015	sc.ForwardSetState(SCE_JAVA_PREPROCESSOR\|activitySet);
1016	continue; // Without advancing in case of '\'.
1017	}
1018	break;
1019	case SCE_JAVA_COMMENT:
1020	if (sc.Match(`'*'`, `'/'`)) {
1021	sc.Forward();
1022	sc.ForwardSetState(SCE_JAVA_DEFAULT\|activitySet);
1023	} else {
1024	styleBeforeTaskMarker = SCE_JAVA_COMMENT;
1025	highlightTaskMarker(sc, styler, activitySet, markerList, caseSensitive);
1026	}
1027	break;
1028	case SCE_JAVA_COMMENTDOC:
1029	if (sc.Match(`'*'`, `'/'`)) {
1030	sc.Forward();
1031	sc.ForwardSetState(SCE_JAVA_DEFAULT\|activitySet);
1032	} else if (sc.ch == `'@'` \|\| sc.ch == `'\\'`) { // JavaDoc and Doxygen support
1033	// Verify that we have the conditions to mark a comment-doc-keyword
1034	if ((IsASpace(sc.chPrev) \|\| sc.chPrev == `'*'`) && (!IsASpace(sc.chNext))) {
1035	styleBeforeDCKeyword = SCE_JAVA_COMMENTDOC;
1036	sc.SetState(SCE_JAVA_COMMENTDOCKEYWORD\|activitySet);
1037	}
1038	} else if ((sc.ch == `'<'` && sc.chNext != `'/'`)
1039	\|\| (sc.ch == `'/'` && sc.chPrev == `'<'`)) { // XML comment style
1040	styleBeforeDCKeyword = SCE_JAVA_COMMENTDOC;
1041	sc.ForwardSetState(SCE_JAVA_COMMENTDOCKEYWORD \| activitySet);
1042	}
1043	break;
1044	case SCE_JAVA_COMMENTLINE:
1045	if (sc.atLineStart && !continuationLine) {
1046	sc.SetState(SCE_JAVA_DEFAULT\|activitySet);
1047	} else {
1048	styleBeforeTaskMarker = SCE_JAVA_COMMENTLINE;
1049	highlightTaskMarker(sc, styler, activitySet, markerList, caseSensitive);
1050	}
1051	break;
1052	case SCE_JAVA_COMMENTLINEDOC:
1053	if (sc.atLineStart && !continuationLine) {
1054	sc.SetState(SCE_JAVA_DEFAULT\|activitySet);
1055	} else if (sc.ch == `'@'` \|\| sc.ch == `'\\'`) { // JavaDoc and Doxygen support
1056	// Verify that we have the conditions to mark a comment-doc-keyword
1057	if ((IsASpace(sc.chPrev) \|\| sc.chPrev == `'/'` \|\| sc.chPrev == `'!'`) && (!IsASpace(sc.chNext))) {
1058	styleBeforeDCKeyword = SCE_JAVA_COMMENTLINEDOC;
1059	sc.SetState(SCE_JAVA_COMMENTDOCKEYWORD\|activitySet);
1060	}
1061	} else if ((sc.ch == `'<'` && sc.chNext != `'/'`)
1062	\|\| (sc.ch == `'/'` && sc.chPrev == `'<'`)) { // XML comment style
1063	styleBeforeDCKeyword = SCE_JAVA_COMMENTLINEDOC;
1064	sc.ForwardSetState(SCE_JAVA_COMMENTDOCKEYWORD \| activitySet);
1065	}
1066	break;
1067	case SCE_JAVA_COMMENTDOCKEYWORD:
1068	if ((styleBeforeDCKeyword == SCE_JAVA_COMMENTDOC) && sc.Match(`'*'`, `'/'`)) {
1069	sc.ChangeState(SCE_JAVA_COMMENTDOCKEYWORDERROR);
1070	sc.Forward();
1071	sc.ForwardSetState(SCE_JAVA_DEFAULT\|activitySet);
1072	seenDocKeyBrace = false;
1073	} else if (sc.ch == `'['` \|\| sc.ch == `'{'`) {
1074	seenDocKeyBrace = true;
1075	} else if (!setDoxygen.Contains(sc.ch)
1076	&& !(seenDocKeyBrace && (sc.ch == `','` \|\| sc.ch == `'.'`))) {
1077	char s[`100`];
1078	if (caseSensitive) {
1079	sc.GetCurrent(s, sizeof(s));
1080	} else {
1081	sc.GetCurrentLowered(s, sizeof(s));
1082	}
1083	if (!(IsASpace(sc.ch) \|\| (sc.ch == `0`))) {
1084	sc.ChangeState(SCE_JAVA_COMMENTDOCKEYWORDERROR\|activitySet);
1085	} else if (!keywords3.InList(s + `1`) && !keywords3.InList(s)) {
1086	int subStyleCDKW = classifierDocKeyWords.ValueFor(s+`1`);
1087	if (subStyleCDKW >= `0`) {
1088	sc.ChangeState(subStyleCDKW\|activitySet);
1089	} else {
1090	sc.ChangeState(SCE_JAVA_COMMENTDOCKEYWORDERROR\|activitySet);
1091	}
1092	}
1093	sc.SetState(styleBeforeDCKeyword\|activitySet);
1094	seenDocKeyBrace = false;
1095	} else if (sc.ch == `'>'`) {
1096	char s[`100`];
1097	if (caseSensitive) {
1098	sc.GetCurrent(s, sizeof(s));
1099	} else {
1100	sc.GetCurrentLowered(s, sizeof(s));
1101	}
1102	if (!keywords3.InList(s)) {
1103	int subStyleCDKW = classifierDocKeyWords.ValueFor(s + `1`);
1104	if (subStyleCDKW >= `0`) {
1105	sc.ChangeState(subStyleCDKW \| activitySet);
1106	} else {
1107	sc.ChangeState(SCE_JAVA_COMMENTDOCKEYWORDERROR \| activitySet);
1108	}
1109	}
1110	sc.SetState(styleBeforeDCKeyword \| activitySet);
1111	seenDocKeyBrace = false;
1112	}
1113	break;
1114	case SCE_JAVA_STRING:
1115	if (sc.atLineEnd) {
1116	sc.ChangeState(SCE_JAVA_STRINGEOL\|activitySet);
1117	} else if (isIncludePreprocessor) {
1118	if (sc.ch == `'>'`) {
1119	sc.ForwardSetState(SCE_JAVA_DEFAULT\|activitySet);
1120	isIncludePreprocessor = false;
1121	}
1122	} else if (sc.ch == `'\\'`) {
1123	if (options.escapeSequence) {
1124	sc.SetState(SCE_JAVA_ESCAPESEQUENCE\|activitySet);
1125	escapeSeq.resetEscapeState(sc.chNext);
1126	}
1127	sc.Forward(); // Skip all characters after the backslash
1128	} else if (sc.ch == `'\"'`) {
1129	if (sc.chNext == `'_'`) {
1130	sc.ChangeState(SCE_JAVA_USERLITERAL\|activitySet);
1131	} else {
1132	sc.ForwardSetState(SCE_JAVA_DEFAULT\|activitySet);
1133	}
1134	}
1135	break;
1136	case SCE_JAVA_ESCAPESEQUENCE:
1137	escapeSeq.consumeDigit();
1138	if (!escapeSeq.atEscapeEnd(sc.ch)) {
1139	break;
1140	}
1141	if (sc.ch == `'"'`) {
1142	sc.SetState(SCE_JAVA_STRING\|activitySet);
1143	sc.ForwardSetState(SCE_JAVA_DEFAULT\|activitySet);
1144	} else if (sc.ch == `'\\'`) {
1145	escapeSeq.resetEscapeState(sc.chNext);
1146	sc.Forward();
1147	} else {
1148	sc.SetState(SCE_JAVA_STRING\|activitySet);
1149	if (sc.atLineEnd) {
1150	sc.ChangeState(SCE_JAVA_STRINGEOL\|activitySet);
1151	}
1152	}
1153	break;
1154	case SCE_JAVA_HASHQUOTEDSTRING:
1155	if (sc.ch == `'\\'`) {
1156	if (sc.chNext == `'\"'` \|\| sc.chNext == `'\''` \|\| sc.chNext == `'\\'`) {
1157	sc.Forward();
1158	}
1159	} else if (sc.ch == `'\"'`) {
1160	sc.ForwardSetState(SCE_JAVA_DEFAULT\|activitySet);
1161	}
1162	break;
1163	case SCE_JAVA_STRINGRAW:
1164	if (sc.Match(rawStringTerminator.c_str())) {
1165	for (size_t termPos=rawStringTerminator.size(); termPos; termPos--)
1166	sc.Forward();
1167	sc.SetState(SCE_JAVA_DEFAULT\|activitySet);
1168	rawStringTerminator = "";
1169	}
1170	break;
1171	case SCE_JAVA_CHARACTER:
1172	if (sc.atLineEnd) {
1173	sc.ChangeState(SCE_JAVA_STRINGEOL\|activitySet);
1174	} else if (sc.ch == `'\\'`) {
1175	if (sc.chNext == `'\"'` \|\| sc.chNext == `'\''` \|\| sc.chNext == `'\\'`) {
1176	sc.Forward();
1177	}
1178	} else if (sc.ch == `'\''`) {
1179	if (sc.chNext == `'_'`) {
1180	sc.ChangeState(SCE_JAVA_USERLITERAL\|activitySet);
1181	} else {
1182	sc.ForwardSetState(SCE_JAVA_DEFAULT\|activitySet);
1183	}
1184	}
1185	break;
1186	case SCE_JAVA_REGEX:
1187	if (sc.atLineStart) {
1188	sc.SetState(SCE_JAVA_DEFAULT\|activitySet);
1189	} else if (!inRERange && sc.ch == `'/'`) {
1190	sc.Forward();
1191	while (IsLowerCase(sc.ch))
1192	sc.Forward(); // gobble regex flags
1193	sc.SetState(SCE_JAVA_DEFAULT\|activitySet);
1194	} else if (sc.ch == `'\\'` && ((sc.currentPos+`1`) < lineEndNext)) {
1195	// Gobble up the escaped character
1196	sc.Forward();
1197	} else if (sc.ch == `'['`) {
1198	inRERange = true;
1199	} else if (sc.ch == `']'`) {
1200	inRERange = false;
1201	}
1202	break;
1203	case SCE_JAVA_STRINGEOL:
1204	if (sc.atLineStart) {
1205	sc.SetState(SCE_JAVA_DEFAULT\|activitySet);
1206	}
1207	break;
1208	case SCE_JAVA_VERBATIM:
1209	if (options.verbatimStringsAllowEscapes && (sc.ch == `'\\'`)) {
1210	sc.Forward(); // Skip all characters after the backslash
1211	} else if (sc.ch == `'\"'`) {
1212	if (sc.chNext == `'\"'`) {
1213	sc.Forward();
1214	} else {
1215	sc.ForwardSetState(SCE_JAVA_DEFAULT\|activitySet);
1216	}
1217	}
1218	break;
1219	case SCE_JAVA_TRIPLEVERBATIM:
1220	if (sc.Match(R"(""")")) {
1221	while (sc.Match(`'"'`)) {
1222	sc.Forward();
1223	}
1224	sc.SetState(SCE_JAVA_DEFAULT\|activitySet);
1225	}
1226	break;
1227	case SCE_JAVA_UUID:
1228	if (sc.atLineEnd \|\| sc.ch == `')'`) {
1229	sc.SetState(SCE_JAVA_DEFAULT\|activitySet);
1230	}
1231	break;
1232	case SCE_JAVA_TASKMARKER:
1233	if (isoperator(sc.ch) \|\| IsASpace(sc.ch)) {
1234	sc.SetState(styleBeforeTaskMarker\|activitySet);
1235	styleBeforeTaskMarker = SCE_JAVA_DEFAULT;
1236	}
1237	}
1238
1239	if (sc.atLineEnd && !atLineEndBeforeSwitch) {
1240	// State exit processing consumed characters up to end of line.
1241	lineCurrent++;
1242	lineEndNext = styler.LineEnd(lineCurrent);
1243	vlls.Add(lineCurrent, preproc);
1244	}
1245
1246	const bool atLineEndBeforeStateEntry = sc.atLineEnd;
1247
1248	// Determine if a new state should be entered.
1249	if (MaskActive(sc.state) == SCE_JAVA_DEFAULT) {
1250	if (sc.Match(`'@'`, `'\"'`)) {
1251	sc.SetState(SCE_JAVA_VERBATIM\|activitySet);
1252	sc.Forward();
1253	} else if (options.triplequotedStrings && sc.Match(R"(""")")) {
1254	sc.SetState(SCE_JAVA_TRIPLEVERBATIM\|activitySet);
1255	sc.Forward(`2`);
1256	} else if (options.hashquotedStrings && sc.Match(`'#'`, `'\"'`)) {
1257	sc.SetState(SCE_JAVA_HASHQUOTEDSTRING\|activitySet);
1258	sc.Forward();
1259	} else if (options.backQuotedStrings && sc.Match('`')) {
1260	sc.SetState(SCE_JAVA_STRINGRAW\|activitySet);
1261	rawStringTerminator = "`";
1262	} else if (IsADigit(sc.ch) \|\| (sc.ch == `'.'` && IsADigit(sc.chNext))) {
1263	if (lastWordWasUUID) {
1264	sc.SetState(SCE_JAVA_UUID\|activitySet);
1265	lastWordWasUUID = false;
1266	} else {
1267	sc.SetState(SCE_JAVA_NUMBER\|activitySet);
1268	}
1269	} else if (!sc.atLineEnd && (setWordStart.Contains(sc.ch) \|\| (sc.ch == `'@'`))) {
1270	if (lastWordWasUUID) {
1271	sc.SetState(SCE_JAVA_UUID\|activitySet);
1272	lastWordWasUUID = false;
1273	} else {
1274	sc.SetState(SCE_JAVA_IDENTIFIER\|activitySet);
1275	}
1276	} else if (sc.Match(`'/'`, `'*'`)) {
1277	if (sc.Match("/*") \|\| sc.Match("/!")) { // Support of Qt/Doxygen doc. style
1278	sc.SetState(SCE_JAVA_COMMENTDOC\|activitySet);
1279	} else {
1280	sc.SetState(SCE_JAVA_COMMENT\|activitySet);
1281	}
1282	sc.Forward(); // Eat the so it isn't used for the end of the comment*
1283	} else if (sc.Match(`'/'`, `'/'`)) {
1284	if ((sc.Match("///") && !sc.Match("////")) \|\| sc.Match("//!"))
1285	// Support of Qt/Doxygen doc. style
1286	sc.SetState(SCE_JAVA_COMMENTLINEDOC\|activitySet);
1287	else
1288	sc.SetState(SCE_JAVA_COMMENTLINE\|activitySet);
1289	} else if (sc.ch == `'/'`
1290	&& (setOKBeforeRE.Contains(chPrevNonWhite)
1291	\|\| followsReturnKeyword(sc, styler))
1292	&& (!setCouldBePostOp.Contains(chPrevNonWhite)
1293	\|\| !FollowsPostfixOperator(sc, styler))) {
1294	sc.SetState(SCE_JAVA_REGEX\|activitySet); // JavaScript's RegEx
1295	inRERange = false;
1296	} else if (sc.ch == `'\"'`) {
1297	if (sc.chPrev == `'R'`) {
1298	styler.Flush();
1299	if (MaskActive(styler.StyleAt(sc.currentPos - `1`)) == SCE_JAVA_STRINGRAW) {
1300	sc.SetState(SCE_JAVA_STRINGRAW\|activitySet);
1301	rawStringTerminator = ")";
1302	for (Sci_Position termPos = sc.currentPos + `1`;; termPos++) {
1303	const char chTerminator = styler.SafeGetCharAt(termPos, `'('`);
1304	if (chTerminator == `'('`)
1305	break;
1306	rawStringTerminator += chTerminator;
1307	}
1308	rawStringTerminator += `'\"'`;
1309	} else {
1310	sc.SetState(SCE_JAVA_STRING\|activitySet);
1311	}
1312	} else {
1313	sc.SetState(SCE_JAVA_STRING\|activitySet);
1314	}
1315	isIncludePreprocessor = false; // ensure that '>' won't end the string
1316	} else if (isIncludePreprocessor && sc.ch == `'<'`) {
1317	sc.SetState(SCE_JAVA_STRING\|activitySet);
1318	} else if (sc.ch == `'\''`) {
1319	sc.SetState(SCE_JAVA_CHARACTER\|activitySet);
1320	} else if (sc.ch == `'#'` && visibleChars == `0`) {
1321	// Preprocessor commands are alone on their line
1322	sc.SetState(SCE_JAVA_PREPROCESSOR\|activitySet);
1323	// Skip whitespace between # and preprocessor word
1324	do {
1325	sc.Forward();
1326	} while ((sc.ch == `' '` \|\| sc.ch == `'\t'`) && sc.More());
1327	if (sc.Match("include")) {
1328	isIncludePreprocessor = true;
1329	} else {
1330	if (options.trackPreprocessor && IsAlphaNumeric(sc.ch)) {
1331	// If #if is nested too deeply (>31 levels) the active/inactive appearance
1332	// will stop reflecting the code.
1333	if (sc.Match("ifdef") \|\| sc.Match("ifndef")) {
1334	const bool isIfDef = sc.Match("ifdef");
1335	const int startRest = isIfDef ? `5` : `6`;
1336	std::string restOfLine = GetRestOfLine(styler, sc.currentPos + startRest + `1`, false);
1337	bool foundDef = preprocessorDefinitions.find(restOfLine) != preprocessorDefinitions.end();
1338	preproc.StartSection(isIfDef == foundDef);
1339	} else if (sc.Match("if")) {
1340	std::string restOfLine = GetRestOfLine(styler, sc.currentPos + `2`, true);
1341	const bool ifGood = EvaluateExpression(restOfLine, preprocessorDefinitions);
1342	preproc.StartSection(ifGood);
1343	} else if (sc.Match("else")) {
1344	// #else is shown as active if either preceding or following section is active
1345	// as that means that it contributed to the result.
1346	if (preproc.ValidLevel()) {
1347	// If #else has no corresponding #if then take no action as invalid
1348	if (!preproc.CurrentIfTaken()) {
1349	// Inactive, may become active if parent scope active
1350	assert(sc.state == (SCE_JAVA_PREPROCESSOR \| inactiveFlag));
1351	preproc.InvertCurrentLevel();
1352	activitySet = preproc.ActiveState();
1353	// If following is active then show "else" as active
1354	if (!activitySet)
1355	sc.ChangeState(SCE_JAVA_PREPROCESSOR);
1356	} else if (preproc.IsActive()) {
1357	// Active -> inactive
1358	assert(sc.state == SCE_JAVA_PREPROCESSOR);
1359	preproc.InvertCurrentLevel();
1360	activitySet = preproc.ActiveState();
1361	// Continue to show "else" as active as it ends active section.
1362	}
1363	}
1364	} else if (sc.Match("elif")) {
1365	// Ensure only one chosen out of #if .. #elif .. #elif .. #else .. #endif
1366	// #elif is shown as active if either preceding or following section is active
1367	// as that means that it contributed to the result.
1368	if (preproc.ValidLevel()) {
1369	if (!preproc.CurrentIfTaken()) {
1370	// Inactive, if expression true then may become active if parent scope active
1371	assert(sc.state == (SCE_JAVA_PREPROCESSOR \| inactiveFlag));
1372	// Similar to #if
1373	std::string restOfLine = GetRestOfLine(styler, sc.currentPos + `4`, true);
1374	const bool ifGood = EvaluateExpression(restOfLine, preprocessorDefinitions);
1375	if (ifGood) {
1376	preproc.InvertCurrentLevel();
1377	activitySet = preproc.ActiveState();
1378	if (!activitySet)
1379	sc.ChangeState(SCE_JAVA_PREPROCESSOR);
1380	}
1381	} else if (preproc.IsActive()) {
1382	// Active -> inactive
1383	assert(sc.state == SCE_JAVA_PREPROCESSOR);
1384	preproc.InvertCurrentLevel();
1385	activitySet = preproc.ActiveState();
1386	// Continue to show "elif" as active as it ends active section.
1387	}
1388	}
1389	} else if (sc.Match("endif")) {
1390	preproc.EndSection();
1391	activitySet = preproc.ActiveState();
1392	sc.ChangeState(SCE_JAVA_PREPROCESSOR\|activitySet);
1393	} else if (sc.Match("define")) {
1394	if (options.updatePreprocessor && preproc.IsActive()) {
1395	std::string restOfLine = GetRestOfLine(styler, sc.currentPos + `6`, true);
1396	size_t startName = `0`;
1397	while ((startName < restOfLine.length()) && IsSpaceOrTab(restOfLine [startName]))
1398	startName++;
1399	size_t endName = startName;
1400	while ((endName < restOfLine.length()) && setWord.Contains(restOfLine [endName]))
1401	endName++;
1402	std::string key = restOfLine.substr(startName, endName-startName);
1403	if ((endName < restOfLine.length()) && (restOfLine.at(endName) == `'('`)) {
1404	// Macro
1405	size_t endArgs = endName;
1406	while ((endArgs < restOfLine.length()) && (restOfLine [endArgs] != `')'`))
1407	endArgs++;
1408	std::string args = restOfLine.substr(endName + `1`, endArgs - endName - `1`);
1409	size_t startValue = endArgs+`1`;
1410	while ((startValue < restOfLine.length()) && IsSpaceOrTab(restOfLine [startValue]))
1411	startValue++;
1412	std::string value;
1413	if (startValue < restOfLine.length())
1414	value = restOfLine.substr(startValue);
1415	preprocessorDefinitions [key] = SymbolValue (value, args);
1416	ppDefineHistory.push_back(PPDefinition (lineCurrent, key, value, false, args));
1417	definitionsChanged = true;
1418	} else {
1419	// Value
1420	size_t startValue = endName;
1421	while ((startValue < restOfLine.length()) && IsSpaceOrTab(restOfLine [startValue]))
1422	startValue++;
1423	std::string value = restOfLine.substr(startValue);
1424	if (OnlySpaceOrTab(value))
1425	value = "1"; // No value defaults to 1
1426	preprocessorDefinitions [key] = value;
1427	ppDefineHistory.push_back(PPDefinition (lineCurrent, key, value));
1428	definitionsChanged = true;
1429	}
1430	}
1431	} else if (sc.Match("undef")) {
1432	if (options.updatePreprocessor && preproc.IsActive()) {
1433	const std::string restOfLine = GetRestOfLine(styler, sc.currentPos + `5`, false);
1434	std::vector<std::string> tokens = Tokenize(restOfLine);
1435	if (tokens.size() >= `1`) {
1436	const std::string key = tokens [`0`];
1437	preprocessorDefinitions.erase(key);
1438	ppDefineHistory.push_back(PPDefinition (lineCurrent, key, "", true));
1439	definitionsChanged = true;
1440	}
1441	}
1442	}
1443	}
1444	}
1445	} else if (isoperator(sc.ch)) {
1446	sc.SetState(SCE_JAVA_OPERATOR\|activitySet);
1447	}
1448	}
1449
1450	if (sc.atLineEnd && !atLineEndBeforeStateEntry) {
1451	// State entry processing consumed characters up to end of line.
1452	lineCurrent++;
1453	lineEndNext = styler.LineEnd(lineCurrent);
1454	vlls.Add(lineCurrent, preproc);
1455	}
1456
1457	if (!IsASpace(sc.ch) && !IsSpaceEquiv(MaskActive(sc.state))) {
1458	chPrevNonWhite = sc.ch;
1459	visibleChars++;
1460	}
1461	continuationLine = false;
1462	sc.Forward();
1463	}
1464	const bool rawStringsChanged = rawStringTerminators.Merge(rawSTNew, lineCurrent);
1465	if (definitionsChanged \|\| rawStringsChanged)
1466	styler.ChangeLexerState(startPos, startPos + length);
1467	sc.Complete();
1468	}
1469
1470	// Store both the current line's fold level and the next lines in the
1471	// level store to make it easy to pick up with each increment
1472	// and to make it possible to fiddle the current level for "} else {".
1473
1474	void SCI_METHOD LexerJAVA::Fold(Sci_PositionU startPos, Sci_Position length, int initStyle, IDocument *pAccess) {
1475
1476	if (!options.fold)
1477	return;
1478
1479	LexAccessor styler(pAccess);
1480
1481	const Sci_PositionU endPos = startPos + length;
1482	int visibleChars = `0`;
1483	bool inLineComment = false;
1484	Sci_Position lineCurrent = styler.GetLine(startPos);
1485	int levelCurrent = SC_FOLDLEVELBASE;
1486	if (lineCurrent > `0`)
1487	levelCurrent = styler.LevelAt(lineCurrent-`1`) >> `16`;
1488	Sci_PositionU lineStartNext = styler.LineStart(lineCurrent+`1`);
1489	int levelMinCurrent = levelCurrent;
1490	int levelNext = levelCurrent;
1491	char chNext = styler [startPos];
1492	int styleNext = MaskActive(styler.StyleAt(startPos));
1493	int style = MaskActive(initStyle);
1494	const bool userDefinedFoldMarkers = !options.foldExplicitStart.empty() && !options.foldExplicitEnd.empty();
1495	for (Sci_PositionU i = startPos; i < endPos; i++) {
1496	const char ch = chNext;
1497	chNext = styler.SafeGetCharAt(i + `1`);
1498	const int stylePrev = style;
1499	style = styleNext;
1500	styleNext = MaskActive(styler.StyleAt(i + `1`));
1501	const bool atEOL = i == (lineStartNext-`1`);
1502	if ((style == SCE_JAVA_COMMENTLINE) \|\| (style == SCE_JAVA_COMMENTLINEDOC))
1503	inLineComment = true;
1504	if (options.foldComment && options.foldCommentMultiline && IsStreamCommentStyle(style) && !inLineComment) {
1505	if (!IsStreamCommentStyle(stylePrev)) {
1506	levelNext++;
1507	} else if (!IsStreamCommentStyle(styleNext) && !atEOL) {
1508	// Comments don't end at end of line and the next character may be unstyled.
1509	levelNext--;
1510	}
1511	}
1512	if (options.foldComment && options.foldCommentExplicit && ((style == SCE_JAVA_COMMENTLINE) \|\| options.foldExplicitAnywhere)) {
1513	if (userDefinedFoldMarkers) {
1514	if (styler.Match(i, options.foldExplicitStart.c_str())) {
1515	levelNext++;
1516	} else if (styler.Match(i, options.foldExplicitEnd.c_str())) {
1517	levelNext--;
1518	}
1519	} else {
1520	if ((ch == `'/'`) && (chNext == `'/'`)) {
1521	const char chNext2 = styler.SafeGetCharAt(i + `2`);
1522	if (chNext2 == `'{'`) {
1523	levelNext++;
1524	} else if (chNext2 == `'}'`) {
1525	levelNext--;
1526	}
1527	}
1528	}
1529	}
1530	if (options.foldPreprocessor && (style == SCE_JAVA_PREPROCESSOR)) {
1531	if (ch == `'#'`) {
1532	Sci_PositionU j = i + `1`;
1533	while ((j < endPos) && IsASpaceOrTab(styler.SafeGetCharAt(j))) {
1534	j++;
1535	}
1536	if (styler.Match(j, "region") \|\| styler.Match(j, "if")) {
1537	levelNext++;
1538	} else if (styler.Match(j, "end")) {
1539	levelNext--;
1540	}
1541
1542	if (options.foldPreprocessorAtElse && (styler.Match(j, "else") \|\| styler.Match(j, "elif"))) {
1543	levelMinCurrent--;
1544	}
1545	}
1546	}
1547	if (options.foldSyntaxBased && (style == SCE_JAVA_OPERATOR)) {
1548	if (ch == `'{'` \|\| ch == `'['` \|\| ch == `'('`) {
1549	// Measure the minimum before a '{' to allow
1550	// folding on "} else {"
1551	if (options.foldAtElse && levelMinCurrent > levelNext) {
1552	levelMinCurrent = levelNext;
1553	}
1554	levelNext++;
1555	} else if (ch == `'}'` \|\| ch == `']'` \|\| ch == `')'`) {
1556	levelNext--;
1557	}
1558	}
1559	if (!IsASpace(ch))
1560	visibleChars++;
1561	if (atEOL \|\| (i == endPos-`1`)) {
1562	int levelUse = levelCurrent;
1563	if ((options.foldSyntaxBased && options.foldAtElse) \|\|
1564	(options.foldPreprocessor && options.foldPreprocessorAtElse)
1565	) {
1566	levelUse = levelMinCurrent;
1567	}
1568	int lev = levelUse \| levelNext << `16`;
1569	if (visibleChars == `0` && options.foldCompact)
1570	lev \|= SC_FOLDLEVELWHITEFLAG;
1571	if (levelUse < levelNext)
1572	lev \|= SC_FOLDLEVELHEADERFLAG;
1573	if (lev != styler.LevelAt(lineCurrent)) {
1574	styler.SetLevel(lineCurrent, lev);
1575	}
1576	lineCurrent++;
1577	lineStartNext = styler.LineStart(lineCurrent+`1`);
1578	levelCurrent = levelNext;
1579	levelMinCurrent = levelCurrent;
1580	if (atEOL && (i == static_cast<Sci_PositionU>(styler.Length()-`1`))) {
1581	// There is an empty line at end of file so give it same level and empty
1582	styler.SetLevel(lineCurrent, (levelCurrent \| levelCurrent << `16`) \| SC_FOLDLEVELWHITEFLAG);
1583	}
1584	visibleChars = `0`;
1585	inLineComment = false;
1586	}
1587	}
1588	}
1589
1590	void LexerJAVA::EvaluateTokens(std::vector<std::string> &tokens, const SymbolTable &preprocessorDefinitions) {
1591
1592	// Remove whitespace tokens
1593	tokens.erase(std::remove_if(tokens.begin(), tokens.end(), OnlySpaceOrTab), tokens.end());
1594
1595	// Evaluate defined statements to either 0 or 1
1596	for (size_t i=`0`; (i+`1`)<tokens.size();) {
1597	if (tokens [i] == "defined") {
1598	const char *val = "0";
1599	if (tokens [i+`1`] == "(") {
1600	if (((i + `2`)<tokens.size()) && (tokens [i + `2`] == ")")) {
1601	// defined()
1602	tokens.erase(tokens.begin() + i + `1`, tokens.begin() + i + `3`);
1603	} else if (((i+`3`)<tokens.size()) && (tokens [i+`3`] == ")")) {
1604	// defined(<identifier>)
1605	SymbolTable::const_iterator it = preprocessorDefinitions.find(tokens [i+`2`]);
1606	if (it != preprocessorDefinitions.end()) {
1607	val = "1";
1608	}
1609	tokens.erase(tokens.begin() + i + `1`, tokens.begin() + i + `4`);
1610	} else {
1611	// Spurious '(' so erase as more likely to result in false
1612	tokens.erase(tokens.begin() + i + `1`, tokens.begin() + i + `2`);
1613	}
1614	} else {
1615	// defined <identifier>
1616	SymbolTable::const_iterator it = preprocessorDefinitions.find(tokens [i+`1`]);
1617	if (it != preprocessorDefinitions.end()) {
1618	val = "1";
1619	}
1620	tokens.erase(tokens.begin() + i + `1`, tokens.begin() + i + `2`);
1621	}
1622	tokens [i] = val;
1623	} else {
1624	i++;
1625	}
1626	}
1627
1628	// Evaluate identifiers
1629	constexpr size_t maxIterations = `100`;
1630	size_t iterations = `0`; // Limit number of iterations in case there is a recursive macro.
1631	for (size_t i = `0`; (i<tokens.size()) && (iterations < maxIterations);) {
1632	iterations++;
1633	if (setWordStart.Contains(tokens [i][`0`])) {
1634	SymbolTable::const_iterator it = preprocessorDefinitions.find(tokens [i]);
1635	if (it != preprocessorDefinitions.end()) {
1636	// Tokenize value
1637	std::vector<std::string> macroTokens = Tokenize(it ->second.value);
1638	if (it ->second.IsMacro()) {
1639	if ((i + `1` < tokens.size()) && (tokens.at(i + `1`) == "(")) {
1640	// Create map of argument name to value
1641	std::vector<std::string> argumentNames = StringSplit(it ->second.arguments, `','`);
1642	std::map<std::string, std::string> arguments;
1643	size_t arg = `0`;
1644	size_t tok = i+`2`;
1645	while ((tok < tokens.size()) && (arg < argumentNames.size()) && (tokens.at(tok) != ")")) {
1646	if (tokens.at(tok) != ",") {
1647	arguments [argumentNames.at(arg)] = tokens.at(tok);
1648	arg++;
1649	}
1650	tok++;
1651	}
1652
1653	// Remove invocation
1654	tokens.erase(tokens.begin() + i, tokens.begin() + tok + `1`);
1655
1656	// Substitute values into macro
1657	macroTokens.erase(std::remove_if(macroTokens.begin(), macroTokens.end(), OnlySpaceOrTab), macroTokens.end());
1658
1659	for (size_t iMacro = `0`; iMacro < macroTokens.size();) {
1660	if (setWordStart.Contains(macroTokens [iMacro][`0`])) {
1661	std::map<std::string, std::string>::const_iterator itFind = arguments.find(macroTokens [iMacro]);
1662	if (itFind != arguments.end()) {
1663	// TODO: Possible that value will be expression so should insert tokenized form
1664	macroTokens [iMacro] = itFind ->second;
1665	}
1666	}
1667	iMacro++;
1668	}
1669
1670	// Insert results back into tokens
1671	tokens.insert(tokens.begin() + i, macroTokens.begin(), macroTokens.end());
1672
1673	} else {
1674	i++;
1675	}
1676	} else {
1677	// Remove invocation
1678	tokens.erase(tokens.begin() + i);
1679	// Insert results back into tokens
1680	tokens.insert(tokens.begin() + i, macroTokens.begin(), macroTokens.end());
1681	}
1682	} else {
1683	// Identifier not found and value defaults to zero
1684	tokens [i] = "0";
1685	}
1686	} else {
1687	i++;
1688	}
1689	}
1690
1691	// Find bracketed subexpressions and recurse on them
1692	BracketPair bracketPair = FindBracketPair(tokens);
1693	while (bracketPair.itBracket != tokens.end()) {
1694	std::vector<std::string> inBracket(bracketPair.itBracket + `1`, bracketPair.itEndBracket);
1695	EvaluateTokens(inBracket, preprocessorDefinitions);
1696
1697	// The insertion is done before the removal because there were failures with the opposite approach
1698	tokens.insert(bracketPair.itBracket, inBracket.begin(), inBracket.end());
1699
1700	bracketPair = FindBracketPair(tokens);
1701	tokens.erase(bracketPair.itBracket, bracketPair.itEndBracket + `1`);
1702
1703	bracketPair = FindBracketPair(tokens);
1704	}
1705
1706	// Evaluate logical negations
1707	for (size_t j=`0`; (j+`1`)<tokens.size();) {
1708	if (setNegationOp.Contains(tokens [j][`0`])) {
1709	int isTrue = atoi(tokens [j+`1`].c_str());
1710	if (tokens [j] == "!")
1711	isTrue = !isTrue;
1712	std::vector<std::string>::iterator itInsert =
1713	tokens.erase(tokens.begin() + j, tokens.begin() + j + `2`);
1714	tokens.insert(itInsert, isTrue ? "1" : "0");
1715	} else {
1716	j++;
1717	}
1718	}
1719
1720	// Evaluate expressions in precedence order
1721	enum precedence { precMult, precAdd, precRelative
1722	, precLogical, / end marker / precLast };
1723	for (int prec = precMult; prec < precLast; prec++) {
1724	// Looking at 3 tokens at a time so end at 2 before end
1725	for (size_t k=`0`; (k+`2`)<tokens.size();) {
1726	const char chOp = tokens [k+`1`][`0`];
1727	if (
1728	((prec==precMult) && setMultOp.Contains(chOp)) \|\|
1729	((prec==precAdd) && setAddOp.Contains(chOp)) \|\|
1730	((prec==precRelative) && setRelOp.Contains(chOp)) \|\|
1731	((prec==precLogical) && setLogicalOp.Contains(chOp))
1732	) {
1733	const int valA = atoi(tokens [k].c_str());
1734	const int valB = atoi(tokens [k+`2`].c_str());
1735	int result = `0`;
1736	if (tokens [k+`1`] == "+")
1737	result = valA + valB;
1738	else if (tokens [k+`1`] == "-")
1739	result = valA - valB;
1740	else if (tokens [k+`1`] == "*")
1741	result = valA * valB;
1742	else if (tokens [k+`1`] == "/")
1743	result = valA / (valB ? valB : `1`);
1744	else if (tokens [k+`1`] == "%")
1745	result = valA % (valB ? valB : `1`);
1746	else if (tokens [k+`1`] == "<")
1747	result = valA < valB;
1748	else if (tokens [k+`1`] == "<=")
1749	result = valA <= valB;
1750	else if (tokens [k+`1`] == ">")
1751	result = valA > valB;
1752	else if (tokens [k+`1`] == ">=")
1753	result = valA >= valB;
1754	else if (tokens [k+`1`] == "==")
1755	result = valA == valB;
1756	else if (tokens [k+`1`] == "!=")
1757	result = valA != valB;
1758	else if (tokens [k+`1`] == "\|\|")
1759	result = valA \|\| valB;
1760	else if (tokens [k+`1`] == "&&")
1761	result = valA && valB;
1762	std::vector<std::string>::iterator itInsert =
1763	tokens.erase(tokens.begin() + k, tokens.begin() + k + `3`);
1764	tokens.insert(itInsert, std::to_string(result));
1765	} else {
1766	k++;
1767	}
1768	}
1769	}
1770	}
1771
1772	std::vector<std::string> LexerJAVA::Tokenize(const std::string &expr) const {
1773	// Break into tokens
1774	std::vector<std::string> tokens;
1775	const char *cp = expr.c_str();
1776	while (*cp) {
1777	std::string word;
1778	if (setWord.Contains(*cp)) {
1779	// Identifiers and numbers
1780	while (setWord.Contains(*cp)) {
1781	word += *cp;
1782	cp++;
1783	}
1784	} else if (IsSpaceOrTab(*cp)) {
1785	while (IsSpaceOrTab(*cp)) {
1786	word += *cp;
1787	cp++;
1788	}
1789	} else if (setRelOp.Contains(*cp)) {
1790	word += *cp;
1791	cp++;
1792	if (setRelOp.Contains(*cp)) {
1793	word += *cp;
1794	cp++;
1795	}
1796	} else if (setLogicalOp.Contains(*cp)) {
1797	word += *cp;
1798	cp++;
1799	if (setLogicalOp.Contains(*cp)) {
1800	word += *cp;
1801	cp++;
1802	}
1803	} else {
1804	// Should handle strings, characters, and comments here
1805	word += *cp;
1806	cp++;
1807	}
1808	tokens.push_back(word);
1809	}
1810	return tokens;
1811	}
1812
1813	bool LexerJAVA::EvaluateExpression(const std::string &expr, const SymbolTable &preprocessorDefinitions) {
1814	std::vector<std::string> tokens = Tokenize(expr);
1815
1816	EvaluateTokens(tokens, preprocessorDefinitions);
1817
1818	// "0" or "" -> false else true
1819	const bool isFalse = tokens.empty() \|\|
1820	((tokens.size() == `1`) && ((tokens [`0`] == "") \|\| tokens [`0`] == "0"));
1821	return !isFalse;
1822	}
1823
// Lexer module objects: one built with LexerFactoryJAVA under the name "java" and
// one built with LexerFactoryJAVAInsensitive under the name "javanocase".
// Both are given the javaWordLists descriptions.
LexerModule lmJAVA(SCLEX_JAVA, LexerJAVA::LexerFactoryJAVA, "java", javaWordLists);
LexerModule lmJAVANoCase(SCLEX_JAVANOCASE, LexerJAVA::LexerFactoryJAVAInsensitive, "javanocase", javaWordLists);
1826

Browse the source code of DeepinIDE/3rdparty/unioncode-scintilla515/lexilla/lexers/LexJAVA.cxx