shithub: rgbds

--- a/src/asm/lexer.c

+++ b/src/asm/lexer.c

@@ -865,7 +865,7 @@

 /* forward declarations for peek */

-static void shiftChars(uint8_t distance);

+static void shiftChar(void);

 static char const *readInterpolation(void);

 static int peek(uint8_t distance)

@@ -889,7 +889,8 @@

 				 * expanded, so skip it and keep peeking.

*/

 				if (!str[0]) {

-					shiftChars(2);

+					shiftChar();

+					shiftChar();

 					goto restart;

@@ -909,7 +910,7 @@

 		} else if (c == '{' && !lexerState->disableInterpolation) {

 			/* If character is an open brace, do symbol interpolation */

-			shiftChars(1);

+			shiftChar();

 			char const *ptr = readInterpolation();

 			if (ptr) {

@@ -922,24 +923,24 @@

 	return c;

-static void shiftChars(uint8_t distance)

+static void shiftChar(void)

 	if (lexerState->capturing) {

 		if (lexerState->captureBuf) {

-			if (lexerState->captureSize + distance >= lexerState->captureCapacity)

+			if (lexerState->captureSize + 1 >= lexerState->captureCapacity)

 				reallocCaptureBuf();

 			/* TODO: improve this? */

-			for (uint8_t i = 0; i < distance; i++)

-				lexerState->captureBuf[lexerState->captureSize++] = peek(i);

-		} else {

-			lexerState->captureSize += distance;

+			lexerState->captureBuf[lexerState->captureSize] = peek(0);

+		lexerState->captureSize++;

-	lexerState->macroArgScanDistance -= distance;

+	lexerState->macroArgScanDistance--;

 	/* FIXME: this may not be too great, as only the top level is considered... */

+	uint8_t distance = 1;

/*

 	 * The logic is as follows:

 	 * - Any characters up to the expansion need to be consumed in the file

@@ -997,7 +998,7 @@

 	/* If not at EOF, advance read position */

 	if (c != EOF)

-		shiftChars(1);

+		shiftChar();

 	return c;

@@ -1004,7 +1005,7 @@

 static void handleCRLF(int c)

 	if (c == '\r' && peek(0) == '\n')

-		shiftChars(1);

+		shiftChar();

 /* "Services" provided by the lexer to the rest of the program */

@@ -1060,7 +1061,7 @@

 			error("Unterminated block comment\n");

 			goto finish;

 		case '\r':

-			/* Handle CRLF before nextLine() since shiftChars updates colNo */

+			/* Handle CRLF before nextLine() since shiftChar updates colNo */

 			handleCRLF(c);

 			/* fallthrough */

 		case '\n':

@@ -1075,7 +1076,7 @@

 			continue;

 		case '*':

 			if (peek(0) == '/') {

-				shiftChars(1);

+				shiftChar();

 				goto finish;

 			/* fallthrough */

@@ -1100,7 +1101,7 @@

 		if (c == EOF || c == '\r' || c == '\n')

 			break;

-		shiftChars(1);

+		shiftChar();

 	lexerState->disableMacroArgs = false;

 	lexerState->disableInterpolation = false;

@@ -1115,10 +1116,10 @@

 		int c = peek(0);

 		if (isWhitespace(c)) {

-			shiftChars(1);

+			shiftChar();

 		} else if (c == '\r' || c == '\n') {

-			shiftChars(1);

-			/* Handle CRLF before nextLine() since shiftChars updates colNo */

+			shiftChar();

+			/* Handle CRLF before nextLine() since shiftChar updates colNo */

 			handleCRLF(c);

 			if (!lexerState->expansions || lexerState->expansions->distance)

 				nextLine();

@@ -1141,7 +1142,7 @@

 	// We come here having already peeked at one char, so no need to do it again

 	do {

-		shiftChars(1);

+		shiftChar();

 		n++;

 	} while (peek(0) == c);

@@ -1154,7 +1155,7 @@

 	uint32_t value = baseValue;

-	for (;; shiftChars(1)) {

+	for (;; shiftChar()) {

 		int c = peek(0);

 		if (c == '_')

@@ -1174,7 +1175,7 @@

 	uint32_t value = 0, divisor = 1;

 	dbgPrint("Reading fractional part\n");

-	for (;; shiftChars(1)) {

+	for (;; shiftChar()) {

 		int c = peek(0);

 		if (c == '_')

@@ -1185,9 +1186,9 @@

 			warning(WARNING_LARGE_CONSTANT,

 				"Precision of fixed-point constant is too large\n");

 			/* Discard any additional digits */

-			shiftChars(1);

+			shiftChar();

 			while (c = peek(0), (c >= '0' && c <= '9') || c == '_')

-				shiftChars(1);

+				shiftChar();

 			break;

 		value = value * 10 + (c - '0');

@@ -1212,7 +1213,7 @@

 	uint32_t value = 0;

 	dbgPrint("Reading binary number with digits [%c,%c]\n", binDigits[0], binDigits[1]);

-	for (;; shiftChars(1)) {

+	for (;; shiftChar()) {

 		int c = peek(0);

 		int bit;

@@ -1238,7 +1239,7 @@

 	bool empty = true;

 	dbgPrint("Reading hex number\n");

-	for (;; shiftChars(1)) {

+	for (;; shiftChar()) {

 		int c = peek(0);

 		if (c >= 'a' && c <= 'f') /* Convert letters to right after digits */

@@ -1295,7 +1296,7 @@

 		if (width < 9)

 			width++;

-		shiftChars(1);

+		shiftChar();

 	if (width == 0)

@@ -1332,7 +1333,7 @@

 		 && (c > 'z' || c < 'a')

 		 && c != '#' && c != '.' && c != '@' && c != '_')

 			break;

-		shiftChars(1);

+		shiftChar();

 		/* Write the char to the identifier's name */

 		if (i < sizeof(yylval.tzSym) - 1)

@@ -1372,7 +1373,7 @@

 		int c = peek(0);

 		if (c == '{') { /* Nested interpolation */

-			shiftChars(1);

+			shiftChar();

 			char const *ptr = readInterpolation();

 			if (ptr) {

@@ -1383,10 +1384,10 @@

 			error("Missing }\n");

 			break;

 		} else if (c == '}') {

-			shiftChars(1);

+			shiftChar();

 			break;

 		} else if (c == ':' && !fmt_IsFinished(&fmt)) { /* Format spec, only once */

-			shiftChars(1);

+			shiftChar();

 			for (size_t j = 0; j < i; j++)

 				fmt_UseCharacter(&fmt, symName[j]);

 			fmt_FinishCharacters(&fmt);

@@ -1395,7 +1396,7 @@

 				error("Invalid format spec '%s'\n", symName);

 			i = 0; /* Now that format has been set, restart at beginning of string */

 		} else {

-			shiftChars(1);

+			shiftChar();

 			if (i < sizeof(symName)) /* Allow writing an extra char to flag overflow */

 				symName[i++] = c;

@@ -1483,10 +1484,10 @@

 	// We reach this function after reading a single quote, but we also support triple quotes

 	if (peek(0) == '"') {

-		shiftChars(1);

+		shiftChar();

 		if (peek(0) == '"') {

 			// """ begins a multi-line string

-			shiftChars(1);

+			shiftChar();

 			multiline = true;

 		} else {

 			// "" is an empty string, skip the loop

@@ -1504,11 +1505,11 @@

 		// We'll be staying in the string, so we can safely consume the char

-		shiftChars(1);

+		shiftChar();

 		// Handle '\r' or '\n' (in multiline strings only, already handled above otherwise)

 		if (c == '\r' || c == '\n') {

-			/* Handle CRLF before nextLine() since shiftChars updates colNo */

+			/* Handle CRLF before nextLine() since shiftChar updates colNo */

 			handleCRLF(c);

 			nextLine();

 			c = '\n';

@@ -1520,12 +1521,12 @@

 				// Only """ ends a multi-line string

 				if (peek(0) != '"')

 					break;

-				shiftChars(1);

+				shiftChar();

 				if (peek(0) != '"') {

 					append_yylval_tzString('"');

 					break;

-				shiftChars(1);

+				shiftChar();

 			goto finish;

@@ -1537,19 +1538,19 @@

 			case '{':

 			case '}':

 				// Return that character unchanged

-				shiftChars(1);

+				shiftChar();

 				break;

 			case 'n':

 				c = '\n';

-				shiftChars(1);

+				shiftChar();

 				break;

 			case 'r':

 				c = '\r';

-				shiftChars(1);

+				shiftChar();

 				break;

 			case 't':

 				c = '\t';

-				shiftChars(1);

+				shiftChar();

 				break;

 			// Line continuation

@@ -1572,7 +1573,7 @@

 			case '7':

 			case '8':

 			case '9':

-				shiftChars(1);

+				shiftChar();

 				char const *str = readMacroArg(c);

 				while (*str)

@@ -1586,7 +1587,7 @@

 			default:

 				error("Illegal character escape %s\n", printChar(c));

-				shiftChars(1);

+				shiftChar();

 				break;

 			break;

@@ -1633,11 +1634,11 @@

 	append_yylval_tzString('"');

 	if (peek(0) == '"') {

 		append_yylval_tzString('"');

-		shiftChars(1);

+		shiftChar();

 		if (peek(0) == '"') {

 			// """ begins a multi-line string

 			append_yylval_tzString('"');

-			shiftChars(1);

+			shiftChar();

 			multiline = true;

 		} else {

 			// "" is an empty string, skip the loop

@@ -1655,11 +1656,11 @@

 		// We'll be staying in the string, so we can safely consume the char

-		shiftChars(1);

+		shiftChar();

 		// Handle '\r' or '\n' (in multiline strings only, already handled above otherwise)

 		if (c == '\r' || c == '\n') {

-			/* Handle CRLF before nextLine() since shiftChars updates colNo */

+			/* Handle CRLF before nextLine() since shiftChar updates colNo */

 			handleCRLF(c);

 			nextLine();

 			c = '\n';

@@ -1672,11 +1673,11 @@

 				if (peek(0) != '"')

 					break;

 				append_yylval_tzString('"');

-				shiftChars(1);

+				shiftChar();

 				if (peek(0) != '"')

 					break;

 				append_yylval_tzString('"');

-				shiftChars(1);

+				shiftChar();

 			append_yylval_tzString('"');

 			goto finish;

@@ -1694,7 +1695,7 @@

 			case 't':

 				// Return that character unchanged

 				append_yylval_tzString('\\');

-				shiftChars(1);

+				shiftChar();

 				break;

 			// Line continuation

@@ -1717,7 +1718,7 @@

 			case '7':

 			case '8':

 			case '9':

-				shiftChars(1);

+				shiftChar();

 				char const *str = readMacroArg(c);

 				i = appendEscapedSubstring(str, i);

@@ -1731,12 +1732,12 @@

 			case ',': /* `\,` inside a macro arg string literal */

 				warning(WARNING_OBSOLETE,

 					"`\\,` is deprecated inside strings\n");

-				shiftChars(1);

+				shiftChar();

 				break;

 			default:

 				error("Illegal character escape %s\n", printChar(c));

-				shiftChars(1);

+				shiftChar();

 				break;

 			break;

@@ -1833,7 +1834,7 @@

 		case '*': /* Either MUL or EXP */

 			if (peek(0) == '*') {

-				shiftChars(1);

+				shiftChar();

 				return T_OP_EXP;

 			return T_OP_MUL;

@@ -1840,7 +1841,7 @@

 		case '/': /* Either division or a block comment */

 			if (peek(0) == '*') {

-				shiftChars(1);

+				shiftChar();

 				discardBlockComment();

 				break;

@@ -1848,7 +1849,7 @@

 		case '|': /* Either binary or logical OR */

 			if (peek(0) == '|') {

-				shiftChars(1);

+				shiftChar();

 				return T_OP_LOGICOR;

 			return T_OP_OR;

@@ -1855,7 +1856,7 @@

 		case '=': /* Either SET alias, or EQ */

 			if (peek(0) == '=') {

-				shiftChars(1);

+				shiftChar();

 				return T_OP_LOGICEQU;

 			return T_POP_EQUAL;

@@ -1863,10 +1864,10 @@

 		case '<': /* Either a LT, LTE, or left shift */

 			switch (peek(0)) {

 			case '=':

-				shiftChars(1);

+				shiftChar();

 				return T_OP_LOGICLE;

 			case '<':

-				shiftChars(1);

+				shiftChar();

 				return T_OP_SHL;

 			default:

 				return T_OP_LOGICLT;

@@ -1875,10 +1876,10 @@

 		case '>': /* Either a GT, GTE, or right shift */

 			switch (peek(0)) {

 			case '=':

-				shiftChars(1);

+				shiftChar();

 				return T_OP_LOGICGE;

 			case '>':

-				shiftChars(1);

+				shiftChar();

 				return T_OP_SHR;

 			default:

 				return T_OP_LOGICGT;

@@ -1886,7 +1887,7 @@

 		case '!': /* Either a NEQ, or negation */

 			if (peek(0) == '=') {

-				shiftChars(1);

+				shiftChar();

 				return T_OP_LOGICNE;

 			return T_OP_LOGICNOT;

@@ -1910,13 +1911,13 @@

 			if (yylval.nConstValue == 0xff00) {

 				/* Whitespace is ignored anyways */

 				while (isWhitespace(c = peek(0)))

-					shiftChars(1);

+					shiftChar();

 				if (c == '+') {

-					shiftChars(1);

+					shiftChar();

 					while (isWhitespace(c = peek(0)))

-						shiftChars(1);

+						shiftChar();

 					if (c == 'c' || c == 'C') {

-						shiftChars(1);

+						shiftChar();

 						return T_MODE_HW_C;

 					/* Retroactively lex the plus after the $ff00 */

@@ -1937,7 +1938,7 @@

 		case '9':

 			readNumber(10, c - '0');

 			if (peek(0) == '.') {

-				shiftChars(1);

+				shiftChar();

 				readFractionalPart();

 			return T_NUMBER;

@@ -1945,7 +1946,7 @@

 		case '&':

 			secondChar = peek(0);

 			if (secondChar == '&') {

-				shiftChars(1);

+				shiftChar();

 				return T_OP_LOGICAND;

 			} else if (secondChar >= '0' && secondChar <= '7') {

 				readNumber(8, 0);

@@ -2047,7 +2048,7 @@

 	/* Trim left whitespace (stops at a block comment or line continuation) */

 	while (isWhitespace(peek(0)))

-		shiftChars(1);

+		shiftChar();

 	for (;;) {

 		c = peek(0);

@@ -2054,7 +2055,7 @@

 		switch (c) {

 		case '"': /* String literals inside macro args */

-			shiftChars(1);

+			shiftChar();

 			i = appendStringLiteral(i);

 			break;

@@ -2069,9 +2070,9 @@

 			goto finish;

 		case '/': /* Block comments inside macro args */

-			shiftChars(1); /* Shift the slash */

+			shiftChar();

 			if (peek(0) == '*') {

-				shiftChars(1);

+				shiftChar();

 				discardBlockComment();

 				continue;

@@ -2079,7 +2080,7 @@

 			break;

 		case '\\': /* Character escape */

-			shiftChars(1); /* Shift the backslash */

+			shiftChar();

 			c = peek(0);

 			switch (c) {

@@ -2124,7 +2125,7 @@

 		default: /* Regular characters will just get copied */

 			append_yylval_tzString(c);

-			shiftChars(1);

+			shiftChar();

 			break;

@@ -2146,7 +2147,7 @@

 	// then T_COMMA) without advancing the read. To avoid this, commas in raw

 	// mode end the current macro argument but are not tokenized themselves.

 	if (c == ',') {

-		shiftChars(1);

+		shiftChar();

 		return T_STRING;

@@ -2161,7 +2162,7 @@

 	lexer_SetMode(LEXER_NORMAL);

 	if (c == '\r' || c == '\n') {

-		shiftChars(1);

+		shiftChar();

 		handleCRLF(c);

 		return T_NEWLINE;

@@ -2198,11 +2199,11 @@

 				c = peek(0);

 				if (!isWhitespace(c))

 					break;

-				shiftChars(1);

+				shiftChar();

 			if (startsIdentifier(c)) {

-				shiftChars(1);

+				shiftChar();

 				token = readIdentifier(c);

 				switch (token) {

 				case T_POP_IF:

@@ -2248,7 +2249,7 @@

 			if (c == '\r' || c == '\n') {

-				/* Handle CRLF before nextLine() since shiftChars updates colNo */

+				/* Handle CRLF before nextLine() since shiftChar updates colNo */

 				handleCRLF(c);

 				/* Do this both on line continuations and plain EOLs */

 				nextLine();

@@ -2293,11 +2294,11 @@

 				c = peek(0);

 				if (!isWhitespace(c))

 					break;

-				shiftChars(1);

+				shiftChar();

 			if (startsIdentifier(c)) {

-				shiftChars(1);

+				shiftChar();

 				switch (readIdentifier(c)) {

 				case T_POP_FOR:

 				case T_POP_REPT:

@@ -2335,7 +2336,7 @@

 			if (c == '\r' || c == '\n') {

-				/* Handle CRLF before nextLine() since shiftChars updates colNo */

+				/* Handle CRLF before nextLine() since shiftChar updates colNo */

 				handleCRLF(c);

 				/* Do this both on line continuations and plain EOLs */

 				nextLine();