cxfidc
diff --git a/‎python/pom.xml
+2-1 b/‎python/pom.xml
+2-1
diff --git a/‎python/python3-without-actions/README.md
+43 b/‎python/python3-without-actions/README.md
+43
diff --git a/‎python/python3-without-actions/pom.xml
+53 b/‎python/python3-without-actions/pom.xml
+53
diff --git a/‎python/python3-without-actions/src/IndentationErrorListener.java
+32 b/‎python/python3-without-actions/src/IndentationErrorListener.java
+32
diff --git a/‎python/python3-without-actions/src/LexerWithIndentDedentInjector.java
+223 b/‎python/python3-without-actions/src/LexerWithIndentDedentInjector.java
+223
@@ -18,7 +18,8 @@
 		<module>python3-js</module>
 		<module>python3-py</module>
 		<module>python3-ts</module>
-		<module>python3_without_actions</module>
+		<module>python3-without-actions</module>
 		<module>python3alt</module>
+		<module>tiny-python</module>
 	</modules>
 </project>
@@ -0,0 +1,43 @@
+# Python 3 parser without grammar actions &nbsp; [![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT)
+
+A Python 3 parser that based on the Bart Kiers's Python 3.3 grammar with an improved indentation handling outside of the grammar with the following advantages:
+-  more informative token metadata
+-  reusable code for grammar with embedded action and without action
+-  detection of various indentation errors
+
+#### Some indentation errors with message:
+```python
+ i = 1 # first line begins with space
+#  line 1:1	IndentationError: unexpected indent
+
+
+if i == 1:
+j = 
+#  line 2:0	IndentationError: expected an indented block
+
+
+if i == 1:
+    j = 0
+        k = 0
+#  line 3:8	IndentationError: unexpected indent
+
+
+if i == 1:
+    j = 0
+  k = 0
+#  line 3:2	IndentationError: unindent does not match any outer indentation level
+```
+
+## How to use
+```bash
+antlr4 Python3.g4
+javac *.java
+java Main test.py
+```
+
+## Related links
+[The Python 3.3.7 Language Reference](https://docs.python.org/3.3/reference/grammar.html)
+
+[Bart Kiers's Python 3.3 ANTLR4 grammar](https://github.com/bkiers/python3-parser)
+
+
@@ -0,0 +1,53 @@
+<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+	xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
+	<modelVersion>4.0.0</modelVersion>
+	<artifactId>python3-without-actions</artifactId>
+	<packaging>jar</packaging>
+	<name>Python 3 grammar without embedded actions</name>
+	<parent>
+		<groupId>org.antlr.grammars</groupId>
+		<artifactId>pythonparent</artifactId>
+		<version>1.0-SNAPSHOT</version>
+		<relativePath>../pom.xml</relativePath>
+	</parent>
+	<build>
+		<plugins>
+			<plugin>
+				<groupId>org.antlr</groupId>
+				<artifactId>antlr4-maven-plugin</artifactId>
+				<version>${antlr.version}</version>
+				<configuration>
+					<sourceDirectory>${basedir}</sourceDirectory>
+					<grammars>Python3.g4</grammars>
+					<visitor>true</visitor>
+					<listener>true</listener>
+				</configuration>
+				<executions>
+					<execution>
+						<goals>
+							<goal>antlr4</goal>
+						</goals>
+					</execution>
+				</executions>
+			</plugin>
+			<plugin>
+	            <groupId>org.apache.maven.plugins</groupId>
+	            <artifactId>maven-compiler-plugin</artifactId>
+	            <executions>
+	                <execution>
+	                    <id>default-compile</id>
+	                    <phase>none</phase>
+	                </execution>
+	            </executions>
+        	</plugin>
+			<plugin>
+                <groupId>org.apache.maven.plugins</groupId>
+                <artifactId>maven-compiler-plugin</artifactId>
+                <configuration>
+                    <source>11</source>
+                    <target>11</target>
+                </configuration>
+            </plugin>
+		</plugins>
+	</build>
+</project>
@@ -0,0 +1,32 @@
+import org.antlr.v4.runtime.*;
+
+public class IndentationErrorListener extends BaseErrorListener {
+    private boolean isFirstTime = true;
+
+    @Override
+    public void syntaxError(Recognizer<?, ?> recognizer,
+                            Object offendingSymbol,
+                            int line, int charPositionInLine,
+                            String msg,
+                            RecognitionException e) {
+
+        if (isFirstTime) {
+            isFirstTime = false;
+            System.out.println();
+            System.err.println("ERROR:");
+        }
+
+        if (msg.startsWith(LexerWithIndentDedentInjector.TEXT_LEXER)) { // this is a custom error message from the lexer contained a pattern
+            System.err.println(msg.substring(LexerWithIndentDedentInjector.TEXT_LEXER.length())); // displaying the lexer error message without the pattern
+        } else { // this is a parser error message
+            String startOfMessage = "line " + line + ":" + charPositionInLine + "\t ";
+            if (msg.startsWith("missing INDENT")) {
+                System.err.println(startOfMessage + "IndentationError: expected an indented block"); // displaying the modified parser error message
+            } else if (msg.startsWith("extraneous input '<" + LexerWithIndentDedentInjector.TEXT_INSERTED_INDENT)) {
+                System.err.println(startOfMessage + "IndentationError: unexpected indent"); // displaying the modified parser error message
+            } else {
+                System.err.println(startOfMessage + "at " + offendingSymbol + ": " + msg); // displaying the original parser error message
+            }
+        }
+    }
+}
@@ -0,0 +1,223 @@
+/*
+/*
+ * The MIT License (MIT)
+ *
+ * Copyright (c) 2019 Robert Einhorn
+ *
+ * Permission is hereby granted, free of charge, to any person
+ * obtaining a copy of this software and associated documentation
+ * files (the "Software"), to deal in the Software without
+ * restriction, including without limitation the rights to use,
+ * copy, modify, merge, publish, distribute, sublicense, and/or sell
+ * copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following
+ * conditions:
+ *
+ * The above copyright notice and this permission notice shall be
+ * included in all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
+ * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
+ * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
+ * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
+ * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
+ * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
+ * OTHER DEALINGS IN THE SOFTWARE.
+ *
+ * Project      : Python3 Indent/Dedent handler for ANTLR4 grammars
+ *                https://github.com/antlr/grammars-v4/tree/master/python/python3-without-actions
+ * Developed by : Robert Einhorn, [email protected]
+ */
+
+import org.antlr.v4.runtime.*;
+
+// *************************************************************************************************************
+// **** THE FOLLOWING IMPORT SECTION ALSO CAN BE USED IN THE SECTION OF THE @lexer::header{} IN THE GRAMMAR ****
+// *************************************************************************************************************
+import java.util.*;
+
+public class LexerWithIndentDedentInjector extends Python3Lexer { //*** https://www.antlr.org/api/Java/org/antlr/v4/runtime/Lexer.html
+    public LexerWithIndentDedentInjector(CharStream input) {
+        super(input);
+    }
+
+    // *******************************************************************************************************
+    // **** THE FOLLOWING SECTION ALSO CAN BE USED IN THE SECTION OF THE @lexer::members{} IN THE GRAMMAR ****
+    // *******************************************************************************************************
+    // The stack that keeps track of the indentation lengths
+    private final Stack<Integer> indentLengths = new Stack<>() {{ push(0); }}; // initializing with default 0 indentation length
+    // A queue where extra tokens are pushed on
+    private final Deque<Token> pendingTokens = new ArrayDeque<>();
+    // An integer that stores the type of the last appended token to the token stream
+    private int lastAppendedTokenType;
+
+    // The amount of opened braces, brackets and parenthesis
+    private int opened = 0;
+
+    // Was there space char in the indentations?
+    private boolean wasSpaceIndentation = false;
+    // Was there TAB char in the indentations?
+    private boolean wasTabIndentation = false;
+
+    // A string list that stores the lexer warnings
+    private List<String> warnings = new ArrayList<>();
+    // A string list that stores the lexer error messages
+    private List<String> errors = new ArrayList<>();
+
+    // Patterns for the custom error listener to recognize error messages
+    public static final String TEXT_LEXER = "lexer --> ";
+    public static final String TEXT_INSERTED_INDENT = "inserted INDENT";
+
+    @Override
+    public Token nextToken() {
+        final boolean atVeryFirstCharWhichIsSpaceOrTAB = getCharIndex() == 0 && List.of((int) ' ', (int) '\t').contains(_input.LA(1));
+        Token currentToken;
+
+        while (true) {
+            currentToken = super.nextToken(); // get a token from the inputstream
+            this.insertLeadingTokens(atVeryFirstCharWhichIsSpaceOrTAB, currentToken.getType(), currentToken.getStartIndex());
+            switch (currentToken.getType()) {
+                case OPEN_PAREN:
+                case OPEN_BRACK:
+                case OPEN_BRACE:
+                    this.opened++;
+                    this.pendingTokens.addLast(currentToken);  // insert the current open parentheses or square bracket or curly brace token
+                    break;
+                case CLOSE_PAREN:
+                case CLOSE_BRACK:
+                case CLOSE_BRACE:
+                    this.opened--;
+                    this.pendingTokens.addLast(currentToken);  // insert the current close parentheses or square bracket or curly brace token
+                    break;
+                case NEWLINE:
+                    if (this.opened > 0) {                             //*** https://docs.python.org/3/reference/lexical_analysis.html#implicit-line-joining
+                        continue;  // We're inside an implicit line joining section, skip the NEWLINE token
+                    } else {
+                        switch (_input.LA(1) /* next symbol */) {    //*** https://www.antlr.org/api/Java/org/antlr/v4/runtime/IntStream.html#LA(int)
+                            case '\r':
+                            case '\n':
+                            case '\f':
+                            case '#':                                  //*** https://docs.python.org/3/reference/lexical_analysis.html#blank-lines
+                                continue;  // We're on a blank line or before a comment, skip the NEWLINE token
+                            default:
+                                this.pendingTokens.addLast(currentToken); // insert the current NEWLINE token
+                                this.insertIndentDedentTokens();       //*** https://docs.python.org/3/reference/lexical_analysis.html#indentation
+                        }
+                    }
+                    break;
+                case EOF:
+                    if ( !this.indentLengths.isEmpty() ) {
+                        this.insertTrailingTokens(); // indentLengths stack wil be empty
+                        this.checkSpaceAndTabIndentation();
+                        this.pendingTokens.addLast(currentToken); // insert the current EOF token
+                    }
+                    break;
+                default:
+                    this.pendingTokens.addLast(currentToken); // insert the current token
+            }
+            break; // exit from the loop
+        }
+        this.lastAppendedTokenType = this.pendingTokens.peekFirst().getType(); // save the token type before removing from the deque for the trailing tokens inserting later
+        return this.pendingTokens.pollFirst(); // append a token to the token stream until the first returning EOF
+    }
+
+    private void insertLeadingTokens(boolean atVeryFirstCharWhichIsSpaceOrTAB, int type, int startIndex) {
+        if (atVeryFirstCharWhichIsSpaceOrTAB &&   // We're at the first line of the input starting with a space or TAB
+            !List.of(NEWLINE, EOF).contains(type) // and within that the first token that is visible (comments were skiped and OPEN_PAREN, OPEN_BRACK OPEN_BRACE cannot be the first token)
+            ) {                                   // We need to insert a NEWLINE and an INDENT token before the first token to raise an 'unexpected indent' error by the parser later
+            this.insertToken(0, startIndex - 1, "<inserted leading NEWLINE>" + " ".repeat(startIndex), NEWLINE, 1, 0);
+            this.insertToken(startIndex, startIndex - 1, "<" + TEXT_INSERTED_INDENT + ", " + this.getIndentationDescription(startIndex) + ">", Python3Parser.INDENT, 1, startIndex);
+            this.indentLengths.push(startIndex);
+        }
+    }
+
+    private void insertIndentDedentTokens() {
+        final int currentIndentLength = this.getIndentationLength(getText());
+        int previousIndentLength = this.indentLengths.peek();
+
+        if (currentIndentLength > previousIndentLength) { // insert an INDENT token
+            this.insertToken("<" + TEXT_INSERTED_INDENT + ", " + this.getIndentationDescription(currentIndentLength) + ">", Python3Parser.INDENT);
+            this.indentLengths.push(currentIndentLength);
+        } else if (currentIndentLength < previousIndentLength) {
+            do {   // More than 1 DEDENT token may be inserted
+                this.indentLengths.pop();
+                previousIndentLength = this.indentLengths.peek();
+                if (currentIndentLength <= previousIndentLength) {
+                    this.insertToken("<inserted DEDENT, " + this.getIndentationDescription(previousIndentLength) + ">", Python3Parser.DEDENT);
+                } else {
+                    this.insertToken("<inserted (I N C O N S I S T E N T!) DEDENT, " + this.getIndentationDescription(currentIndentLength) + ">", Python3Parser.DEDENT);
+                    this.errors.add(TEXT_LEXER + "line " + getLine() + ":" + getCharPositionInLine() + "\t IndentationError: unindent does not match any outer indentation level");
+                }
+            } while (currentIndentLength < previousIndentLength);
+        }
+    }
+
+    private void insertTrailingTokens() {
+        if ( !List.of(NEWLINE, Python3Parser.DEDENT).contains(this.lastAppendedTokenType) ) { // If the last token was not NEWLINE or DEDENT then
+            this.insertToken("<inserted trailing NEWLINE>", NEWLINE); // insert an extra trailing NEWLINE token that serves as the end of the statement
+        }
+
+        this.indentLengths.removeElementAt(0); // Remove the default 0 indentation length
+        while ( !this.indentLengths.isEmpty() ) { // Now insert as much trailing DEDENT tokens as needed
+            this.insertToken("<inserted trailing DEDENT, " + this.getIndentationDescription(this.indentLengths.pop()) + ">", Python3Parser.DEDENT);
+        }
+    }
+
+    private String getIndentationDescription(int lengthOfIndent) {
+        return "length=" + lengthOfIndent + ", level=" + (this.indentLengths.size());
+    }
+
+    private void insertToken(String text, int type) {
+        final int startIndex = _tokenStartCharIndex + getText().length(); //*** https://www.antlr.org/api/Java/org/antlr/v4/runtime/Lexer.html#_tokenStartCharIndex
+        this.insertToken(startIndex, startIndex - 1, text, type, getLine(), getCharPositionInLine());
+    }
+
+    private void insertToken(int startIndex, int stopIndex, String text, int type, int line, int charPositionInLine) {
+        CommonToken token = new CommonToken(_tokenFactorySourcePair, type, DEFAULT_TOKEN_CHANNEL, startIndex, stopIndex); //*** https://www.antlr.org/api/Java/org/antlr/v4/runtime/CommonToken.html
+        token.setText(text);
+        token.setLine(line);
+        token.setCharPositionInLine(charPositionInLine);
+        this.pendingTokens.addLast(token);
+    }
+
+    // Calculates the indentation of the provided spaces, taking the
+    // following rules into account:
+    //
+    // "Tabs are replaced (from left to right) by one to eight spaces
+    //  such that the total number of characters up to and including
+    //  the replacement is a multiple of eight [...]"
+    //
+    //  -- https://docs.python.org/3.1/reference/lexical_analysis.html#indentation
+    private int getIndentationLength(String textOfMatchedNEWLINE) {
+        int count = 0;
+
+        for (char ch : textOfMatchedNEWLINE.toCharArray()) {
+            switch (ch) {
+                case ' ': // A normal space char
+                    this.wasSpaceIndentation = true;
+                    count++;
+                    break;
+                case '\t':
+                    this.wasTabIndentation = true;
+                    count += 8 - (count % 8);
+                    break;
+            }
+        }
+        return count;
+    }
+
+    private void checkSpaceAndTabIndentation() {
+        if (this.wasSpaceIndentation && this.wasTabIndentation) {
+            this.warnings.add("Mixture of space and tab were used for indentation.");
+        }
+    }
+
+    public List<String> getWarnings() { // can be called from a grammar embedded action also
+        return this.warnings;
+    }
+
+    public List<String> getErrorMessages() { // can be called from a grammar embedded action also
+        return this.errors;
+    }
+}