RobEin
diff --git a/‎PythonLexer.g4
+2 b/‎PythonLexer.g4
+2
diff --git a/‎PythonParser.g4
+2-1 b/‎PythonParser.g4
+2-1
diff --git a/‎README.md
+1-1 b/‎README.md
+1-1
diff --git a/‎port_CSharp/AssemblyInfo.cs
+2-1 b/‎port_CSharp/AssemblyInfo.cs
+2-1
diff --git a/‎port_CSharp/README.md
+4-4 b/‎port_CSharp/README.md
+4-4
diff --git a/‎port_CSharp/csgrun4py.cs
-35 b/‎port_CSharp/csgrun4py.cs
-35
diff --git a/‎port_CSharp/grun4py.cs
+143 b/‎port_CSharp/grun4py.cs
+143
diff --git a/‎port_Dart/README.md
+1-1 b/‎port_Dart/README.md
+1-1
diff --git a/‎port_Dart/bin/dartgrun4py.dart ‎port_Dart/bin/grun4py.dart b/‎port_Dart/bin/dartgrun4py.dart ‎port_Dart/bin/grun4py.dart
diff --git a/‎port_Dart/pubspec.yaml
+1-1 b/‎port_Dart/pubspec.yaml
+1-1
diff --git a/‎port_Go/README.md
+1-1 b/‎port_Go/README.md
+1-1
diff --git a/‎port_Go/gogrun4py.go
-44 b/‎port_Go/gogrun4py.go
-44
@@ -28,7 +28,9 @@ THE SOFTWARE.
   */
 
 lexer grammar PythonLexer;
+
 options { superClass=PythonLexerBase; }
+
 tokens {
     // the following tokens are only for compatibility with the PythonLexerBase class
     LSQB, RSQB, LBRACE, RBRACE
 
@@ -26,8 +26,9 @@ THE SOFTWARE.
  * Developed by : Robert Einhorn
  */
 
+// Tiny Python based on: https://docs.python.org/3.8/reference/grammar.html
+parser grammar PythonParser;
 
-parser grammar PythonParser; // Tiny Python based on: https://docs.python.org/3.8/reference/grammar.html
 options { tokenVocab=PythonLexer; }
 
 // ANTLR4 grammar for a tiny Python
 
@@ -1,7 +1,7 @@
 # Tiny Python &nbsp; [![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT)
 A considerably stripped down Python grammar for a starter Python (or a Python-like) parser or even for educational purposes. 
 
-The ANTLR4 parser grammar is based on the last "traditional" [Python 3.8 grammar](https://docs.python.org/3.8/reference/grammar.html) which not yet written in [PEG](https://en.wikipedia.org/wiki/Parsing_expression_grammar).
+The ANTLR4 parser grammar is based on the last "traditional" [Python 3.8 grammar](https://docs.python.org/3.8/reference/grammar.html), which was not yet written in [PEG](https://peps.python.org/pep-0617/).
 
 
 ### Related links:
 
@@ -1 +1,2 @@
-[assembly: CLSCompliant(true)] 
+[assembly: CLSCompliant(true)]
+
@@ -2,13 +2,13 @@
 
 #### Prerequisites:
 - Installed [ANTLR4-tools](https://github.com/antlr/antlr4/blob/master/doc/getting-started.md#getting-started-the-easy-way-using-antlr4-tools)
-- Installed [.NET Framework](https://dotnet.microsoft.com/en-us/download/dotnet-framework)
+- Installed [.NET](https://dotnet.microsoft.com/en-us/download)
 
 
 #### Command line example for Windows:
- - first create a C# project called csgrun4py then copy the two grammar files and example.py to this directory:
+ - first create a C# project called grun4py then copy the two grammar files and example.py to this directory:
 ```bash
-    dotnet new console -o . -n csgrun4py -f net8.0
+    dotnet new console -o . -n grun4py -f net9.0
     del program.cs
     dotnet add package Antlr4.Runtime.Standard --version 4.13.1
 ```
@@ -22,7 +22,7 @@
 antlr4 -Dlanguage=CSharp PythonLexer.g4
 antlr4 -Dlanguage=CSharp PythonParser.g4
 dotnet build
-dotnet run example.py --no-build
+dotnet run example.py --no-build
 ```
 
 
 
@@ -0,0 +1,143 @@
+// ******* GRUN (Grammar Unit Test) for Python *******
+
+using System;
+using System.Text.RegularExpressions;
+using System.Text;
+using Antlr4.Runtime;
+
+namespace grun4py
+{
+    internal static class Program
+    {
+        /// <summary>
+        /// Entry point: tokenizes the Python source file named by the first argument, prints
+        /// every token, then parses the token stream with the <c>file_input</c> rule.
+        /// </summary>
+        /// <param name="args">Command-line arguments; <c>args[0]</c> is the input file path.</param>
+        /// <returns>
+        /// The number of syntax errors reported by the parser (0 when there are none), capped
+        /// at 255; 1 when no input file was given or an exception was caught.
+        /// </returns>
+        public static int Main(string[] args)
+        {
+            // Exit statuses are truncated to their low 8 bits on POSIX systems, so an uncapped
+            // error count of 256 would be reported to the shell as 0 (success).
+            const int MaxExitCode = 255;
+
+            if (args.Length < 1)
+            {
+                Console.Error.WriteLine("Error: Please provide an input file path");
+                return 1;
+            }
+
+            try
+            {
+                var filePath = args[0];
+                var input = GetEncodedInputStreamByPythonComment(filePath);
+                var lexer = new PythonLexer(input);
+                var tokens = new CommonTokenStream((ITokenSource)lexer);
+                var parser = new PythonParser(tokens);
+
+                tokens.Fill(); // Test the lexer grammar
+                foreach (IToken t in tokens.GetTokens())
+                {
+                    Console.WriteLine(GetTokenMetaDataWithTokenName(t));
+                }
+
+                parser.file_input(); // Test the parser grammar
+                return Math.Min(parser.NumberOfSyntaxErrors, MaxExitCode);
+            }
+            catch (Exception ex)
+            {
+                Console.Error.WriteLine($"Error: {ex.Message}");
+                return 1; // Error occurred, returning non-zero exit code
+            }
+        }
+
+        /// <summary>
+        /// Renders one token as a single bracketed line in the form
+        /// <c>[@TokenIndex,StartIndex:StopIndex='Text',&lt;TokenName&gt;,channel=ChannelName,Line:Column]</c>.
+        /// The <c>channel=...</c> part is left out for tokens on the default channel.
+        /// </summary>
+        /// <param name="token">The token to describe.</param>
+        /// <returns>The formatted description of <paramref name="token"/>.</returns>
+        private static string GetTokenMetaDataWithTokenName(IToken token)
+        {
+            // Control characters in the token text are shown as escape sequences.
+            string shownText = ReplaceSpecialCharacters(token.Text);
+
+            // The EOF token is labelled with the literal name "EOF".
+            string name;
+            if (token.Type == TokenConstants.EOF)
+            {
+                name = "EOF";
+            }
+            else
+            {
+                name = PythonLexer.DefaultVocabulary.GetDisplayName(token.Type);
+            }
+
+            string channelPart = "";
+            if (token.Channel != TokenConstants.DefaultChannel)
+            {
+                channelPart = $"channel={PythonLexer.channelNames[token.Channel]},";
+            }
+
+            string span = $"{token.StartIndex}:{token.StopIndex}";
+            string position = $"{token.Line}:{token.Column}";
+            return $"[@{token.TokenIndex},{span}='{shownText}',<{name}>,{channelPart}{position}]";
+        }
+
+        /// <summary>
+        /// Makes line feed, carriage return, tab and form feed characters visible by replacing
+        /// each with its two-character escape sequence (backslash followed by n, r, t or f).
+        /// </summary>
+        /// <param name="text">The text to escape.</param>
+        /// <returns>A copy of <paramref name="text"/> with those four characters escaped.</returns>
+        private static string ReplaceSpecialCharacters(string text)
+        {
+            var escaped = new StringBuilder(text.Length);
+            foreach (char c in text)
+            {
+                switch (c)
+                {
+                    case '\n':
+                        escaped.Append(@"\n");
+                        break;
+                    case '\r':
+                        escaped.Append(@"\r");
+                        break;
+                    case '\t':
+                        escaped.Append(@"\t");
+                        break;
+                    case '\f':
+                        escaped.Append(@"\f");
+                        break;
+                    default:
+                        escaped.Append(c);
+                        break;
+                }
+            }
+            return escaped.ToString();
+        }
+
+        /// <summary>
+        /// Opens <paramref name="filePath"/> as an ANTLR character stream, using the encoding
+        /// declared in a comment on one of the first two lines of the file when there is one,
+        /// and UTF-8 otherwise.
+        /// </summary>
+        /// <param name="filePath">Path of the Python source file to read.</param>
+        /// <returns>The character stream created by <c>CharStreams.fromPath</c>.</returns>
+        public static ICharStream? GetEncodedInputStreamByPythonComment(string filePath)
+        {
+            const string DefaultPythonEncoding = "utf-8"; // default encoding for Python source code
+            var blankOrCommentLine = new Regex(@"^[ \t\f]*(#.*)?$");
+            string declaredEncoding = "";
+
+            try
+            {
+                // The file is scanned with an ASCII reader only to look for the declaration.
+                using FileStream rawFile = new(filePath, FileMode.Open, FileAccess.Read);
+                using StreamReader asciiReader = new(rawFile, Encoding.ASCII);
+
+                // Only the first two lines are examined; stop as soon as a name is found.
+                int linesLeft = 2;
+                while (linesLeft-- > 0 && declaredEncoding == "")
+                {
+                    string? current = asciiReader.ReadLine();
+                    if (current == null || !blankOrCommentLine.IsMatch(current))
+                    {
+                        // EOF, or a line that is neither blank nor a pure comment
+                        // (a statement or a backslash): no declaration can follow.
+                        break;
+                    }
+
+                    declaredEncoding = GetEncodingName(current);
+                }
+            }
+            catch (Exception)
+            {
+                // Detection is best effort: on any failure continue with what was found so far.
+            }
+
+            string chosenEncoding = declaredEncoding == "" ? DefaultPythonEncoding : declaredEncoding;
+
+            try // encoding test for ANTLR4
+            {
+                return CharStreams.fromPath(filePath, Encoding.GetEncoding(chosenEncoding));
+            }
+            catch (Exception)
+            {
+                // Retry once with the default encoding.
+                return CharStreams.fromPath(filePath, Encoding.GetEncoding(DefaultPythonEncoding));
+            }
+        }
+
+        /// <summary>
+        /// Extracts the encoding name from a Python source-encoding comment such as
+        /// <c># -*- coding: latin-1 -*-</c>.
+        /// </summary>
+        /// <param name="commentText">One line of source text to inspect.</param>
+        /// <returns>
+        /// The declared encoding name, with the aliases "cp1252", "latin-1" and "iso-8859-1"
+        /// (in any letter case) normalized to "latin1"; an empty string when the line
+        /// contains no encoding declaration.
+        /// </returns>
+        public static string GetEncodingName(string commentText) // https://peps.python.org/pep-0263/#defining-the-encoding
+        {
+            var encodingCommentPattern = new Regex(@"^[ \t\f]*#.*?coding[:=][ \t]*([-_.a-zA-Z0-9]+)");
+            var match = encodingCommentPattern.Match(commentText);
+            if (!match.Success)
+            {
+                return "";
+            }
+
+            string encodingName = match.Groups[1].Value;
+
+            // normalize encoding name
+            // The lookup ignores case ordinally rather than lower-casing with the current
+            // culture: under e.g. tr-TR, "ISO-8859-1".ToLower() yields a dotless 'ı' and
+            // would miss the alias.
+            var encodingMap = new Dictionary<string, string>(StringComparer.OrdinalIgnoreCase)
+            {
+                { "cp1252", "latin1" },
+                { "latin-1", "latin1" },
+                { "iso-8859-1", "latin1" }
+                // more encoding pairs
+            };
+
+            return encodingMap.TryGetValue(encodingName, out var normalizedEncodingName)
+                ? normalizedEncodingName
+                : encodingName;
+        }
+    }
+}
@@ -23,7 +23,7 @@ Windows:
 ```bash
 antlr4 -Dlanguage=Dart PythonLexer.g4
 antlr4 -Dlanguage=Dart PythonParser.g4
-dart dartgrun4py.dart example.py
+dart grun4py.dart example.py
 ```
 
 #### Related link:
 
@@ -1,4 +1,4 @@
-name: dartgrun4py
+name: grun4py
 
 environment:
   sdk: ^3.4.4
 
@@ -30,7 +30,7 @@ Windows:
 ```bash
 go generate ./...
 go mod tidy
-go run gogrun4py.go example.py
+go run grun4py.go example.py
 ```
 
 #### Related link:
Original file line number	Diff line number	Diff line change
`@@ -1 +1,2 @@`
`1`		`-[assembly: CLSCompliant(true)]`
	`1`	`+[assembly: CLSCompliant(true)]`
	`2`	`+`
Original file line number	Diff line number	Diff line change
`@@ -1,4 +1,4 @@`
`1`		`-name: dartgrun4py`
	`1`	`+name: grun4py`
`2`	`2`
`3`	`3`	`environment:`
`4`	`4`	`sdk: ^3.4.4`