diff --git a/docs/docs/en/changelog.md b/docs/docs/en/changelog.md index ba4145e7..bff44f1d 100644 --- a/docs/docs/en/changelog.md +++ b/docs/docs/en/changelog.md @@ -10,6 +10,7 @@ ### Changes - Introducing Constants. Constant can be imported only when using a module. +- Support for long number declaration: `700L`, `0xABL` - Fixed variables scope in shadowing. - Better error visualizing. Parse errors shows exact line in which an error occurs. Same for Linter and Runtime errors. - Semantic linter as a required stage. diff --git a/docs/docs/ru/changelog.md b/docs/docs/ru/changelog.md index 038b82db..01c7b25f 100644 --- a/docs/docs/ru/changelog.md +++ b/docs/docs/ru/changelog.md @@ -10,6 +10,7 @@ ### Изменения - Добавлены константы. Константа может быть импортирована только при подключении модуля. +- Возможность задать числа типа long: `700L`, `0xABL` - Исправлена область видимости переменных при шедоуинге. - Улучшена визуализация ошибок. Ошибки парсинга показывают конкретное место, где возникла ошибка. То же самое с линтером и ошибками времени исполнения. - Семантический линтер как обязательный этап работы интерпретатора. diff --git a/ownlang-parser/src/main/java/com/annimon/ownlang/parser/Lexer.java b/ownlang-parser/src/main/java/com/annimon/ownlang/parser/Lexer.java index 72663ef3..aea3a268 100644 --- a/ownlang-parser/src/main/java/com/annimon/ownlang/parser/Lexer.java +++ b/ownlang-parser/src/main/java/com/annimon/ownlang/parser/Lexer.java @@ -167,7 +167,8 @@ private void tokenizeNumber() { while (true) { if (current == '.') { decimal = true; - if (hasDot) throw error("Invalid float number " + buffer, startPos); + if (hasDot) + throw error("Invalid float number " + buffer, startPos); hasDot = true; } else if (current == 'e' || current == 'E') { decimal = true; @@ -182,6 +183,9 @@ private void tokenizeNumber() { } if (decimal) { addToken(TokenType.DECIMAL_NUMBER, buffer.toString(), startPos); + } else if (current == 'L') { + next(); + addToken(TokenType.LONG_NUMBER, buffer.toString(), startPos); } else { addToken(TokenType.NUMBER, buffer.toString(), startPos); } @@ -232,7 +236,12 @@ private void tokenizeHexNumber(int skipChars) { if (buffer.isEmpty()) throw error("Empty HEX value", startPos); if (peek(-1) == '_') throw error("HEX value cannot end with _", startPos, markEndPos()); - addToken(TokenType.HEX_NUMBER, buffer.toString(), startPos); + if (current == 'L') { + next(); + addToken(TokenType.HEX_LONG_NUMBER, buffer.toString(), startPos); + } else { + addToken(TokenType.HEX_NUMBER, buffer.toString(), startPos); + } } private static boolean isNumber(char current) { diff --git a/ownlang-parser/src/main/java/com/annimon/ownlang/parser/Parser.java b/ownlang-parser/src/main/java/com/annimon/ownlang/parser/Parser.java index 45bc8a78..689f19c9 100644 --- a/ownlang-parser/src/main/java/com/annimon/ownlang/parser/Parser.java +++ b/ownlang-parser/src/main/java/com/annimon/ownlang/parser/Parser.java @@ -50,6 +50,14 @@ public static Node parse(List tokens) { ASSIGN_OPERATORS.put(TokenType.ATEQ, BinaryExpression.Operator.AT); } + private static final EnumSet NUMBER_TOKEN_TYPES = EnumSet.of( + TokenType.NUMBER, + TokenType.LONG_NUMBER, + TokenType.DECIMAL_NUMBER, + TokenType.HEX_NUMBER, + TokenType.HEX_LONG_NUMBER + ); + private final List tokens; private final int size; private final ParseErrors parseErrors; @@ -347,7 +355,7 @@ private Node functionChain(Node qualifiedNameExpr) { } if (lookMatch(0, TokenType.DOT)) { final List indices = variableSuffix(); - if (indices == null || indices.isEmpty()) { + if (indices.isEmpty()) { return expr; } @@ -411,20 +419,10 @@ private MatchExpression match() { consume(TokenType.CASE); MatchExpression.Pattern pattern = null; final Token current = get(0); - if (match(TokenType.NUMBER)) { - // case 20: - pattern = new MatchExpression.ConstantPattern( - NumberValue.of(createNumber(current.text(), 10)) - ); - } else if (match(TokenType.DECIMAL_NUMBER)) { - // case 0.5: - pattern = new MatchExpression.ConstantPattern( - NumberValue.of(createDecimalNumber(current.text())) - ); - } else if (match(TokenType.HEX_NUMBER)) { - // case #FF: + if (isNumberToken(current.type())) { + // case 20: / case 0.5: / case #FF: pattern = new MatchExpression.ConstantPattern( - NumberValue.of(createNumber(current.text(), 16)) + NumberValue.of(getAsNumber(current)) ); } else if (match(TokenType.TEXT)) { // case "text": @@ -859,7 +857,7 @@ private Node qualifiedName() { final List indices = variableSuffix(); final var variable = new VariableExpression(current.text()); variable.setRange(getRange(startTokenIndex, index - 1)); - if (indices == null || indices.isEmpty()) { + if (indices.isEmpty()) { return variable; } else { return new ContainerAccessExpression(variable, indices, variable.getRange()); @@ -869,7 +867,7 @@ private Node qualifiedName() { private List variableSuffix() { // .key1.arr1[expr1][expr2].key2 if (!lookMatch(0, TokenType.DOT) && !lookMatch(0, TokenType.LBRACKET)) { - return null; + return Collections.emptyList(); } final List indices = new ArrayList<>(); while (lookMatch(0, TokenType.DOT) || lookMatch(0, TokenType.LBRACKET)) { @@ -888,47 +886,72 @@ private List variableSuffix() { private Node value() { final Token current = get(0); - if (match(TokenType.NUMBER)) { - return new ValueExpression(createNumber(current.text(), 10)); - } - if (match(TokenType.DECIMAL_NUMBER)) { - return new ValueExpression(createDecimalNumber(current.text())); - } - if (match(TokenType.HEX_NUMBER)) { - return new ValueExpression(createNumber(current.text(), 16)); + if (isNumberToken(current.type())) { + return new ValueExpression(getAsNumber(current)); } if (match(TokenType.TEXT)) { final ValueExpression strExpr = new ValueExpression(current.text()); // "text".property || "text".func() if (lookMatch(0, TokenType.DOT)) { - if (lookMatch(1, TokenType.WORD) && lookMatch(2, TokenType.LPAREN)) { - match(TokenType.DOT); - return functionChain(new ContainerAccessExpression( - strExpr, - Collections.singletonList(new ValueExpression(consume(TokenType.WORD).text())), - getRange() - )); - } - final List indices = variableSuffix(); - if (indices == null || indices.isEmpty()) { - return strExpr; - } - return new ContainerAccessExpression(strExpr, indices, getRange()); + return stringProperty(strExpr); } return strExpr; } throw error("Unknown expression: " + current); } + private Node stringProperty(ValueExpression strExpr) { + if (lookMatch(1, TokenType.WORD) && lookMatch(2, TokenType.LPAREN)) { + match(TokenType.DOT); + return functionChain(new ContainerAccessExpression( + strExpr, + Collections.singletonList(new ValueExpression(consume(TokenType.WORD).text())), + getRange() + )); + } + final List indices = variableSuffix(); + if (indices.isEmpty()) { + return strExpr; + } + return new ContainerAccessExpression(strExpr, indices, getRange()); + } + + private boolean isNumberToken(TokenType type) { + return NUMBER_TOKEN_TYPES.contains(type); + } + + private Number getAsNumber(Token current) { + if (match(TokenType.NUMBER)) { + return createNumber(current.text(), 10); + } + if (match(TokenType.LONG_NUMBER)) { + return createLongNumber(current.text(), 10); + } + if (match(TokenType.DECIMAL_NUMBER)) { + return createDecimalNumber(current.text()); + } + if (match(TokenType.HEX_NUMBER)) { + return createNumber(current.text(), 16); + } + if (match(TokenType.HEX_LONG_NUMBER)) { + return createLongNumber(current.text(), 16); + } + throw error("Unknown number expression: " + current); + } + private Number createNumber(String text, int radix) { // Integer try { return Integer.parseInt(text, radix); } catch (NumberFormatException nfe) { - return Long.parseLong(text, radix); + return createLongNumber(text, radix); } } + private Number createLongNumber(String text, int radix) { + return Long.parseLong(text, radix); + } + private Number createDecimalNumber(String text) { // Double return Double.parseDouble(text); diff --git a/ownlang-parser/src/main/java/com/annimon/ownlang/parser/TokenType.java b/ownlang-parser/src/main/java/com/annimon/ownlang/parser/TokenType.java index cf6a71db..7c7f2c06 100644 --- a/ownlang-parser/src/main/java/com/annimon/ownlang/parser/TokenType.java +++ b/ownlang-parser/src/main/java/com/annimon/ownlang/parser/TokenType.java @@ -7,8 +7,10 @@ public enum TokenType { NUMBER, + LONG_NUMBER, DECIMAL_NUMBER, HEX_NUMBER, + HEX_LONG_NUMBER, WORD, TEXT, diff --git a/ownlang-parser/src/test/java/com/annimon/ownlang/parser/LexerTest.java b/ownlang-parser/src/test/java/com/annimon/ownlang/parser/LexerTest.java index 062cfc8e..22bbba93 100644 --- a/ownlang-parser/src/test/java/com/annimon/ownlang/parser/LexerTest.java +++ b/ownlang-parser/src/test/java/com/annimon/ownlang/parser/LexerTest.java @@ -41,17 +41,17 @@ public static Stream invalidData() { } @Test - public void testNumbers() { - String input = "0 3.1415 0xCAFEBABE 0Xf7_d6_c5 #FFFF"; + void testNumbers() { + String input = "0 800L 3.1415 0xCAFEBABE 0Xf7_d6_c5 #FFFF 0x7FL"; List result = Lexer.tokenize(input); - assertTokens(result, NUMBER, DECIMAL_NUMBER, HEX_NUMBER, HEX_NUMBER, HEX_NUMBER); + assertTokens(result, NUMBER, LONG_NUMBER, DECIMAL_NUMBER, HEX_NUMBER, HEX_NUMBER, HEX_NUMBER, HEX_LONG_NUMBER); assertThat(result) .extracting(Token::text) - .containsExactly("0", "3.1415", "CAFEBABE", "f7d6c5", "FFFF"); + .containsExactly("0", "800", "3.1415", "CAFEBABE", "f7d6c5", "FFFF", "7F"); } @Test - public void testDecimalNumbersExponent() { + void testDecimalNumbersExponent() { String input = "4e+7 0.3E-19 2e0 5e0000000000000200 5E-000000089"; List result = Lexer.tokenize(input); assertThat(result) @@ -61,7 +61,7 @@ public void testDecimalNumbersExponent() { } @Test - public void testString() { + void testString() { String input = "\"1\\\"2\""; List result = Lexer.tokenize(input); assertTokens(result, TEXT); @@ -69,7 +69,7 @@ public void testString() { } @Test - public void testEscapeString() { + void testEscapeString() { String input = """ "\\\\/\\\\" """.stripIndent(); @@ -79,7 +79,7 @@ public void testEscapeString() { } @Test - public void testEmptyString() { + void testEmptyString() { String input = "\"\""; List result = Lexer.tokenize(input); assertTokens(result, TEXT); @@ -87,7 +87,7 @@ public void testEmptyString() { } @Test - public void testComments() { + void testComments() { String input = "// 1234 \n /* */ 123 /* \n 12345 \n\n\n */"; List result = Lexer.tokenize(input); assertTokens(result, NUMBER); @@ -96,7 +96,7 @@ public void testComments() { @ParameterizedTest @MethodSource("validData") - public void testValidInput(String name, String input, List tokenTypes) throws IOException { + void testValidInput(String name, String input, List tokenTypes) throws IOException { List result = Lexer.tokenize(input); assertThat(result) .hasSize(tokenTypes.size()) @@ -106,7 +106,7 @@ public void testValidInput(String name, String input, List tokenTypes @ParameterizedTest @MethodSource("invalidData") - public void testInvalidInput(String name, String input) throws IOException { + void testInvalidInput(String name, String input) throws IOException { assertThatThrownBy(() -> Lexer.tokenize(input)) .isInstanceOf(OwnLangParserException.class); } diff --git a/ownlang-parser/src/test/java/com/annimon/ownlang/parser/LexerValidDataProvider.java b/ownlang-parser/src/test/java/com/annimon/ownlang/parser/LexerValidDataProvider.java index 891eab2e..a22e99ed 100644 --- a/ownlang-parser/src/test/java/com/annimon/ownlang/parser/LexerValidDataProvider.java +++ b/ownlang-parser/src/test/java/com/annimon/ownlang/parser/LexerValidDataProvider.java @@ -33,7 +33,10 @@ private static List numbers() { List.of(DECIMAL_NUMBER)), Arguments.of("Hex numbers", "#FF 0xCA 0x12fb 0xFF", - List.of(HEX_NUMBER, HEX_NUMBER, HEX_NUMBER, HEX_NUMBER)) + List.of(HEX_NUMBER, HEX_NUMBER, HEX_NUMBER, HEX_NUMBER)), + Arguments.of("Long numbers", + "680L #80L 0x700L", + List.of(LONG_NUMBER, HEX_LONG_NUMBER, HEX_LONG_NUMBER)) ); } diff --git a/ownlang-parser/src/test/java/com/annimon/ownlang/parser/ProgramsTest.java b/ownlang-parser/src/test/java/com/annimon/ownlang/parser/ProgramsTest.java index 2de00393..eb32171b 100644 --- a/ownlang-parser/src/test/java/com/annimon/ownlang/parser/ProgramsTest.java +++ b/ownlang-parser/src/test/java/com/annimon/ownlang/parser/ProgramsTest.java @@ -50,7 +50,7 @@ public static void createStage() { @ParameterizedTest @MethodSource("data") - public void testProgram(InputSource inputSource) { + void testProgram(InputSource inputSource) { final StagesDataMap stagesData = new StagesDataMap(); try { testPipeline.perform(stagesData, inputSource); diff --git a/ownlang-parser/src/test/resources/expressions/binaryExpressionOnNumbers.own b/ownlang-parser/src/test/resources/expressions/binaryExpressionOnNumbers.own index 0b6be707..c7341593 100644 --- a/ownlang-parser/src/test/resources/expressions/binaryExpressionOnNumbers.own +++ b/ownlang-parser/src/test/resources/expressions/binaryExpressionOnNumbers.own @@ -14,6 +14,16 @@ def testMultiplicationOnNumbers() { assertEquals(30, 5 * (-2 * -3)) } +def testMultiplicationOverflowOnNumbers() { + assertNotEquals(1234567890000L, 1234567890 * 1000) + assertNotEquals(0xFFFFFF00, 0x100 * 0xFFFFFF) +} + +def testMultiplicationOnLongNumbers() { + assertEquals(1234567890000L, 1234567890 * 1000L) + assertEquals(0xFFFFFF00L, 0x100L * 0xFFFFFF) +} + def testDivisionOnNumbers() { assertEquals(3, 6 / 2) assertEquals(30, -900 / (60 / -2))