mdbrnowski
diff --git a/‎main.py
+17 b/‎main.py
+17
diff --git a/‎semantic_listener.py
+245 b/‎semantic_listener.py
+245
diff --git a/‎test_main.py
+88 b/‎test_main.py
+88
diff --git a/‎tests/semantic/input_binary_operations.txt
+17 b/‎tests/semantic/input_binary_operations.txt
+17
diff --git a/‎tests/semantic/input_break.txt
+1 b/‎tests/semantic/input_break.txt
+1
@@ -4,6 +4,7 @@
 from generated.MyLexer import MyLexer
 from generated.MyParser import MyParser
 from ast_listener import ASTListener
+from semantic_listener import SemanticListener
 
 app = typer.Typer(no_args_is_help=True)
 
@@ -50,5 +51,21 @@ def ast(filename: str):
         ParseTreeWalker().walk(listener, tree)
 
 
+@app.command()
+def sem(filename: str):
+    """Semantic analysis"""
+    # Read the whole source file into memory before lexing.
+    with open(filename, encoding="utf-8") as f:
+        string = f.read()
+
+    # Characters -> tokens -> parser, using the generated lexer and parser.
+    lexer = MyLexer(InputStream(string))
+    stream = CommonTokenStream(lexer)
+    parser = MyParser(stream)
+
+    tree = parser.program()
+    # The semantic pass is skipped entirely when the parser reported syntax
+    # errors; otherwise the listener is walked over the finished parse tree.
+    if parser.getNumberOfSyntaxErrors() == 0:
+        listener = SemanticListener()
+        ParseTreeWalker().walk(listener, tree)
+
+
 if __name__ == "__main__":
     app()
@@ -0,0 +1,245 @@
+from enum import Enum, auto
+from antlr4 import ParserRuleContext
+from generated.MyParser import MyParser
+from generated.MyParserListener import MyParserListener
+
+
+class Type(Enum):
+    """Scalar type tags used by the semantic listener."""
+
+    INT = auto()
+    FLOAT = auto()
+    STRING = auto()
+    # Placeholder stored for a variable when its first assignment is entered;
+    # it is overwritten with the right-hand side's type when that assignment
+    # is exited.
+    TBD = auto()  # to be determined (only during assignment)
+
+
+def is_plain_integer(ctx: ParserRuleContext) -> bool:
+    """Return True when *ctx* is a SingleExpressionContext whose first child is an IntContext."""
+    if not isinstance(ctx, MyParser.SingleExpressionContext):
+        return False
+    return isinstance(ctx.getChild(0), MyParser.IntContext)
+
+
+class SemanticListener(MyParserListener):
+    """Checks break and continue statements, variable declarations, types and assignments."""
+
+    def __init__(self):
+        # Number of for/while loops currently open around the node being walked.
+        self.nested_loop_counter = 0
+        # Variable name -> type recorded for it by the assignment handlers.
+        self.variables: dict[str, Type | None] = {}
+        # Parse-tree node -> type computed for it by the exit* handlers.
+        # Handlers store None for a node after reporting an error on it.
+        self.expr_type: dict[
+            ParserRuleContext, Type | tuple
+        ] = {}  # values are either Type or (Type, int | None, int | None, ...)
+
+    # LOOP CHECKING
+
+    def enterForLoop(self, ctx: MyParser.ForLoopContext):
+        """Count one more enclosing loop while the `for` body is walked."""
+        self.nested_loop_counter += 1
+
+    def exitForLoop(self, ctx: MyParser.ForLoopContext):
+        """Undo the increment made when this `for` loop was entered."""
+        self.nested_loop_counter -= 1
+
+    def enterWhileLoop(self, ctx: MyParser.WhileLoopContext):
+        """Count one more enclosing loop while the `while` body is walked."""
+        self.nested_loop_counter += 1
+
+    def exitWhileLoop(self, ctx: MyParser.WhileLoopContext):
+        """Undo the increment made when this `while` loop was entered."""
+        self.nested_loop_counter -= 1
+
+    def enterBreak(self, ctx: MyParser.BreakContext):
+        """Report a `break` statement that has no enclosing loop."""
+        if self.nested_loop_counter != 0:
+            return
+        break_token = ctx.BREAK().getSymbol()
+        ctx.parser.notifyErrorListeners("Break statement outside of loop", break_token)
+
+    def enterContinue(self, ctx: MyParser.ContinueContext):
+        """Report a `continue` statement that has no enclosing loop."""
+        if self.nested_loop_counter != 0:
+            return
+        continue_token = ctx.CONTINUE().getSymbol()
+        ctx.parser.notifyErrorListeners(
+            "Continue statement outside of loop", continue_token
+        )
+
+    # VARIABLES & TYPES CHECKING
+
+    def enterRange(self, ctx: MyParser.RangeContext):
+        """Placeholder: no check is performed when a range is entered."""
+        pass
+
+    def exitRange(self, ctx: MyParser.RangeContext):
+        """Placeholder: no check is performed and no type is recorded for a range."""
+        pass
+
+    def enterComparison(self, ctx: MyParser.ComparisonContext):
+        """Placeholder: comparisons are only checked on exit."""
+        pass
+
+    def exitComparison(self, ctx: MyParser.ComparisonContext):
+        """Check that the two operands of a comparison have compatible types.
+
+        Accepted combinations are: both operands INT or FLOAT (in any mix) for
+        any operator, or both operands STRING when the operator is EQ or NE.
+        Anything else is reported at the operator token and None is stored for
+        this node. Nothing is stored for a valid comparison.
+        """
+        # Children 0 and 2 are the operands; child 1 is the operator token.
+        children_types = {self.expr_type[ctx.getChild(i)] for i in [0, 2]}
+        if not (
+            children_types <= {Type.INT, Type.FLOAT}
+            or (
+                ctx.getChild(1).symbol.type in {MyParser.EQ, MyParser.NE}
+                and children_types <= {Type.STRING}
+            )
+        ):
+            ctx.parser.notifyErrorListeners(
+                "Incompatible types in a comparison", ctx.getChild(1).getSymbol()
+            )
+            self.expr_type[ctx] = None
+
+    def enterAssignment(self, ctx: MyParser.AssignmentContext):
+        """Register a not-yet-known variable before its right-hand side is walked.
+
+        Only applies to a plain ASSIGN whose target (child 0) is an IdContext.
+        The name is stored with Type.TBD so that exitAssignment can recognise
+        this assignment as the one that introduces the variable.
+        """
+        if (
+            ctx.getChild(1).symbol.type == MyParser.ASSIGN
+            and isinstance(ctx.getChild(0), MyParser.IdContext)
+            and ctx.getChild(0).getText() not in self.variables
+        ):
+            # type is unknown at this point
+            self.variables[ctx.getChild(0).getText()] = Type.TBD
+
+    def exitAssignment(self, ctx: MyParser.AssignmentContext):
+        """Give a variable still marked Type.TBD the type of its right-hand side.
+
+        Only applies to a plain ASSIGN whose target (child 0) is an IdContext
+        and whose variable is still Type.TBD. If the right-hand side (child 2)
+        itself has type Type.TBD, an error is reported at the operator token.
+        """
+        if (
+            ctx.getChild(1).symbol.type == MyParser.ASSIGN
+            and isinstance(ctx.getChild(0), MyParser.IdContext)
+            and self.variables[ctx.getChild(0).getText()] is Type.TBD
+        ):
+            # we finally know the type
+            if self.expr_type[ctx.getChild(2)] is Type.TBD:
+                ctx.parser.notifyErrorListeners(
+                    "Using a variable while declaring it is not allowed",
+                    ctx.getChild(1).getSymbol(),
+                )
+            # NOTE(review): after the error above the variable is stored as
+            # Type.TBD again, so it stays "undetermined" until a later assignment.
+            self.variables[ctx.getChild(0).getText()] = self.expr_type[ctx.getChild(2)]
+
+    def exitBinaryExpression(self, ctx: MyParser.BinaryExpressionContext):
+        """Compute and record the result type of a binary expression.
+
+        For PLUS, MINUS, MULTIPLY and DIVIDE, two INT operands give INT and any
+        other INT/FLOAT mix gives FLOAT. For every other operator the operand
+        types must be equal, and that type is the result. A mismatch is
+        reported at the operator token and None is recorded for this node.
+        """
+        lhs_type = self.expr_type[ctx.getChild(0)]
+        rhs_type = self.expr_type[ctx.getChild(2)]
+        scalar_operators = (
+            MyParser.PLUS,
+            MyParser.MINUS,
+            MyParser.MULTIPLY,
+            MyParser.DIVIDE,
+        )
+        failure = None  # message to report when the operand types do not fit
+        result = None
+
+        if ctx.op.type in scalar_operators:
+            operand_types = {lhs_type, rhs_type}
+            if operand_types == {Type.INT}:
+                result = Type.INT
+            elif operand_types <= {Type.FLOAT, Type.INT}:
+                result = Type.FLOAT
+            else:
+                failure = "Incompatible types in a binary operation"
+        elif lhs_type == rhs_type:
+            result = lhs_type
+        else:
+            failure = "Incompatible types in a matrix binary operation"
+
+        if failure is not None:
+            ctx.parser.notifyErrorListeners(failure, ctx.getChild(1).getSymbol())
+        self.expr_type[ctx] = result
+
+    def exitParenthesesExpression(self, ctx: MyParser.ParenthesesExpressionContext):
+        """Give the parenthesised expression the type of its inner node (child 1)."""
+        self.expr_type[ctx] = self.expr_type[ctx.getChild(1)]
+
+    def exitTransposeExpression(self, ctx: MyParser.TransposeExpressionContext):
+        """Record the type of a transposed expression.
+
+        When the operand's type is a three-item tuple, its last two items are
+        swapped. For any other operand an error is reported at the operator
+        token and the operand's type is passed through unchanged.
+        """
+        operand_type = self.expr_type[ctx.getChild(0)]
+        if isinstance(operand_type, tuple) and len(operand_type) == 3:
+            elem_type, first_dim, second_dim = operand_type
+            self.expr_type[ctx] = (elem_type, second_dim, first_dim)
+            return
+        ctx.parser.notifyErrorListeners(
+            "Transpose operator can only be applied to matrices",
+            ctx.getChild(1).getSymbol(),
+        )
+        self.expr_type[ctx] = operand_type
+
+    def exitMinusExpression(self, ctx: MyParser.MinusExpressionContext):
+        """Give the negated expression the type of its operand (child 1).
+
+        NOTE(review): the operand's type is not validated here.
+        """
+        self.expr_type[ctx] = self.expr_type[ctx.getChild(1)]
+
+    def exitSingleExpression(self, ctx: MyParser.SingleExpressionContext):
+        """Give the wrapper expression the type of its only inspected child (child 0)."""
+        self.expr_type[ctx] = self.expr_type[ctx.getChild(0)]
+
+    def exitSpecialMatrixFunction(self, ctx: MyParser.SpecialMatrixFunctionContext):
+        """Record the type produced by a special matrix function call.
+
+        Every argument must have type INT; otherwise one error is reported at
+        the first child's token and None is recorded. On success the type is
+        (Type.INT, size, ...), where each size is the literal value for a plain
+        integer argument and None for any other argument.
+        """
+        arguments = ctx.children[2::2]  # every second child from index 2
+        if any(self.expr_type[arg] != Type.INT for arg in arguments):
+            # NOTE(review): "dimentions" is misspelled in this user-facing
+            # message; it is kept as-is here to preserve the existing output.
+            ctx.parser.notifyErrorListeners(
+                "Matrix dimentions must be integers", ctx.getChild(0).getSymbol()
+            )
+            self.expr_type[ctx] = None
+            return
+        sizes = (
+            int(arg.getText()) if is_plain_integer(arg) else None
+            for arg in arguments
+        )
+        self.expr_type[ctx] = (Type.INT, *sizes)
+
+    def exitVector(self, ctx: MyParser.VectorContext):
+        """Record the type of a vector literal.
+
+        All elements must have the same type. A vector of scalars gets the type
+        (element type, length). A vector whose elements have tuple types gets
+        the elements' scalar type, followed by this vector's length and then the
+        elements' own dimensions. A mismatch between neighbouring elements is
+        reported at the token that follows the offending element, and None is
+        recorded. None is also recorded, without a new error, when the elements
+        themselves have no valid type.
+        """
+        elements = ctx.children[1::2]  # every second child from index 1
+        for i in range(1, len(elements)):
+            if self.expr_type[elements[i]] != self.expr_type[elements[i - 1]]:
+                # Fall back to the closing bracket when there is no i-th comma.
+                wrong_token = ctx.COMMA(i) or ctx.CLOSE_BRACKET_SQUARE()
+                ctx.parser.notifyErrorListeners(
+                    "Inconsistent types in a vector", wrong_token.getSymbol()
+                )
+                self.expr_type[ctx] = None
+                return
+        # All elements share one type at this point, so the first one is
+        # representative. Using index 0 (instead of 1) keeps single-element
+        # vectors from raising IndexError.
+        elem_type = self.expr_type[elements[0]]
+        if elem_type is None:
+            # The elements already failed their own checks; propagate the
+            # failure instead of subscripting None below.
+            self.expr_type[ctx] = None
+        elif isinstance(elem_type, Type):
+            self.expr_type[ctx] = (elem_type, len(elements))
+        else:
+            self.expr_type[ctx] = (
+                elem_type[0],
+                len(elements),
+                *elem_type[1:],
+            )
+
+    def exitElementReference(self, ctx: MyParser.ElementReferenceContext):
+        """Check an indexing expression and record the type of its result.
+
+        Checks, in order: every index has type INT; the indexed node (child 0)
+        has a tuple type; the number of indices does not exceed the number of
+        dimensions in that tuple. Each failure is reported at child 1's token
+        and records None. With fewer indices than dimensions the result keeps
+        the remaining dimensions; with exactly as many, the result is the
+        scalar element type. Finally, plain integer indices are compared
+        against known dimension sizes.
+        """
+        references = ctx.children[2::2]  # every second child from index 2
+        for ref in references:
+            if self.expr_type[ref] != Type.INT:
+                ctx.parser.notifyErrorListeners(
+                    "Indices must be integers", ctx.getChild(1).getSymbol()
+                )
+                self.expr_type[ctx] = None
+                return
+        id_type = self.expr_type[ctx.getChild(0)]
+        if not isinstance(id_type, tuple):
+            ctx.parser.notifyErrorListeners(
+                "Indexing can only be applied to tensors", ctx.getChild(1).getSymbol()
+            )
+            self.expr_type[ctx] = None
+            return
+        elif len(references) > len(id_type) - 1:
+            # id_type[0] is the element type, so len(id_type) - 1 is the rank.
+            ctx.parser.notifyErrorListeners(
+                "Too many indices", ctx.getChild(1).getSymbol()
+            )
+            self.expr_type[ctx] = None
+            return
+        elif len(references) < len(id_type) - 1:
+            # Partial indexing: drop the indexed dimensions, keep the rest.
+            self.expr_type[ctx] = (id_type[0], *id_type[1 + len(references) :])
+        else:
+            self.expr_type[ctx] = id_type[0]
+
+        # Bounds can only be checked when both the index and the dimension size
+        # are known literals; the recorded type above is left as it is.
+        for i, ref in enumerate(references):
+            if is_plain_integer(ref) and id_type[i + 1] is not None:
+                if int(ref.getText()) >= id_type[i + 1]:
+                    ctx.parser.notifyErrorListeners(
+                        "Index out of bounds", ctx.getChild(1).getSymbol()
+                    )
+
+    def exitId(self, ctx: MyParser.IdContext):
+        """Record the stored type of a variable, or report it as undeclared."""
+        name = ctx.getText()
+        if name in self.variables:
+            self.expr_type[ctx] = self.variables[name]
+            return
+        ctx.parser.notifyErrorListeners(
+            f"Variable {name} not declared", ctx.ID().getSymbol()
+        )
+        self.expr_type[ctx] = None
+
+    def exitInt(self, ctx: MyParser.IntContext):
+        """Record Type.INT for an Int node."""
+        self.expr_type[ctx] = Type.INT
+
+    def exitFloat(self, ctx: MyParser.FloatContext):
+        """Record Type.FLOAT for a Float node."""
+        self.expr_type[ctx] = Type.FLOAT
+
+    def exitString(self, ctx: MyParser.StringContext):
+        """Record Type.STRING for a String node."""
+        self.expr_type[ctx] = Type.STRING
@@ -35,3 +35,91 @@ def test_ast(n):
     with open(f"tests/ast/output_{n}.txt", encoding="utf-8") as f:
         output = f.read()
     assert result.stdout == output
+
+
+def test_sem_error_break():
+    """`sem` on input_break.txt mentions "line 1" and "break"; "line" occurs once."""
+    result = runner.invoke(app, ["sem", "tests/semantic/input_break.txt"])
+    assert result.exit_code == 0
+    assert "line 1" in result.stdout
+    assert "break" in result.stdout.lower()
+    assert result.stdout.count("line") == 1
+
+
+def test_sem_error_continue():
+    """`sem` on input_continue.txt mentions "line 1" and "continue"; "line" occurs once."""
+    result = runner.invoke(app, ["sem", "tests/semantic/input_continue.txt"])
+    assert result.exit_code == 0
+    assert "line 1" in result.stdout
+    assert "continue" in result.stdout.lower()
+    assert result.stdout.count("line") == 1
+
+
+def test_sem_error_vector():
+    """`sem` on input_vector.txt mentions lines 1, 3 and 7; "line" and "vector" each occur three times."""
+    result = runner.invoke(app, ["sem", "tests/semantic/input_vector.txt"])
+    assert result.exit_code == 0
+    assert "line 1" in result.stdout
+    assert "line 3" in result.stdout
+    assert "line 7" in result.stdout
+    assert result.stdout.count("line") == 3
+    assert result.stdout.lower().count("vector") == 3
+
+
+def test_sem_error_variables():
+    """`sem` on input_variables.txt mentions lines 5 and 7; "line" and "variable" each occur twice."""
+    result = runner.invoke(app, ["sem", "tests/semantic/input_variables.txt"])
+    assert result.exit_code == 0
+    assert "line 5" in result.stdout
+    assert "line 7" in result.stdout
+    assert result.stdout.count("line") == 2
+    assert result.stdout.lower().count("variable") == 2
+
+
+def test_sem_error_transpose():
+    """`sem` on input_transpose.txt mentions "line 7" and "transpose"; "line" occurs once."""
+    result = runner.invoke(app, ["sem", "tests/semantic/input_transpose.txt"])
+    assert result.exit_code == 0
+    assert "line 7" in result.stdout
+    assert "transpose" in result.stdout.lower()
+    assert result.stdout.count("line") == 1
+
+
+def test_sem_error_special_matrix():
+    """`sem` on input_special_matrix.txt mentions "line 1" and "line 11"; "line" occurs twice."""
+    result = runner.invoke(app, ["sem", "tests/semantic/input_special_matrix.txt"])
+    assert result.exit_code == 0
+    # NOTE(review): "line 1" is a substring of "line 11", so this first check
+    # is already implied by the next one and does not pin line 1 by itself.
+    assert "line 1" in result.stdout
+    assert "line 11" in result.stdout
+    assert result.stdout.count("line") == 2
+
+
+def test_sem_error_indexing():
+    """`sem` on input_indexing.txt mentions lines 5, 6 and 7; "line" occurs three times."""
+    result = runner.invoke(app, ["sem", "tests/semantic/input_indexing.txt"])
+    assert result.exit_code == 0
+    assert "line 5" in result.stdout
+    assert "line 6" in result.stdout
+    assert "line 7" in result.stdout
+    assert result.stdout.count("line") == 3
+
+
+def test_sem_error_indexing_bounds():
+    """`sem` on input_indexing_bounds.txt mentions lines 4, 11 and 12; "line" occurs three times."""
+    result = runner.invoke(app, ["sem", "tests/semantic/input_indexing_bounds.txt"])
+    assert result.exit_code == 0
+    assert "line 4" in result.stdout
+    assert "line 11" in result.stdout
+    assert "line 12" in result.stdout
+    assert result.stdout.count("line") == 3
+
+
+def test_sem_error_binary_operations():
+    """`sem` on input_binary_operations.txt mentions lines 7, 8, 14, 16 and 17; "line" occurs five times."""
+    result = runner.invoke(app, ["sem", "tests/semantic/input_binary_operations.txt"])
+    assert result.exit_code == 0
+    assert "line 7" in result.stdout
+    assert "line 8" in result.stdout
+    assert "line 14" in result.stdout
+    assert "line 16" in result.stdout
+    assert "line 17" in result.stdout
+    assert result.stdout.count("line") == 5
+
+
+def test_sem_error_comparisons():
+    """`sem` on input_comparisons.txt mentions lines 7 and 9; "line" occurs twice."""
+    result = runner.invoke(app, ["sem", "tests/semantic/input_comparisons.txt"])
+    assert result.exit_code == 0
+    assert "line 7" in result.stdout
+    assert "line 9" in result.stdout
+    assert result.stdout.count("line") == 2
@@ -0,0 +1,17 @@
+a1 = 1;
+a2 = 2;
+
+print a1 + a2;
+
+B = zeros(2);
+print a1 + B;
+print a1 .+ B;
+
+C = ones(2);
+print B .+ C;
+
+D = eye(3);
+print B .+ D;
+
+print 2 + "not ok";
+print 2 .+ "not ok";
@@ -0,0 +1 @@
+break;