
Commit 144ba08

floor and onehot
1 parent 44a914d commit 144ba08

File tree

11 files changed: +688 -6 lines changed

src/CodeGen/math_handler.zig

Lines changed: 125 additions & 1 deletion
@@ -92,6 +92,8 @@ pub fn write_math_op(writer: std.fs.File.Writer, node: *ReadyNode) !void {
         try write_elu(writer, node);
     } else if (std.mem.eql(u8, node.nodeProto.op_type, "Flatten")) {
         try write_flatten(writer, node);
+    } else if (std.mem.eql(u8, node.nodeProto.op_type, "Floor")) {
+        try write_floor(writer, node);
     } else if (std.mem.eql(u8, node.nodeProto.op_type, "Gather")) {
         try write_gather(writer, node);
     } else if (std.mem.eql(u8, node.nodeProto.op_type, "Gemm")) {
@@ -111,7 +113,7 @@ pub fn write_math_op(writer: std.fs.File.Writer, node: *ReadyNode) !void {
     } else if (std.mem.eql(u8, node.nodeProto.op_type, "Neg")) {
         try write_neg(writer, node);
     } else if (std.mem.eql(u8, node.nodeProto.op_type, "OneHot")) {
-        try writer.writeAll("// Handle OneHot\n");
+        try write_oneHot(writer, node);
     } else if (std.mem.eql(u8, node.nodeProto.op_type, "Pad")) {
         try write_pads(writer, node);
     } else if (std.mem.eql(u8, node.nodeProto.op_type, "ReduceMean")) {
@@ -366,6 +368,97 @@ inline fn write_BatchNormalization(writer: std.fs.File.Writer, node: *ReadyNode)
     });
 }
 
+inline fn write_oneHot(writer: std.fs.File.Writer, node: *ReadyNode) !void {
+    // https://onnx.ai/onnx/operators/onnx__OneHot.html
+    // INPUTS:
+    //      - indices (heterogeneous) - T1: Tensor of indices.
+    //      - depth (heterogeneous) - T2: Scalar tensor for depth.
+    //      - values (heterogeneous) - T3: Rank-1 tensor of two elements: [off_value, on_value].
+    // OUTPUT:
+    //      - output (heterogeneous) - T3: Output tensor with one-hot encoding.
+    // ATTRIBUTES:
+    //      - axis - INT (default is -1): Axis along which to add the one-hot dimension.
+
+    var axis: i64 = -1; // Default axis per ONNX
+    for (node.nodeProto.attribute) |attr| {
+        if (std.mem.eql(u8, attr.name, "axis")) {
+            if (attr.type != AttributeType.INT) return error.InvalidAxisType;
+            axis = attr.i;
+        }
+    }
+
+    //----create indices string
+    var indices_string: []u8 = undefined;
+    defer allocator.free(indices_string);
+    if (node.inputs.items[0].?.tag == globals.TensorTag.INITIALIZER) {
+        indices_string = try std.mem.concat(allocator, u8, &[_][]const u8{
+            "@constCast(&param_lib.tensor_",
+            try utils.getSanitizedName(node.inputs.items[0].?.name),
+            ")",
+        });
+    } else {
+        indices_string = try std.mem.concat(allocator, u8, &[_][]const u8{
+            "@constCast(&tensor_",
+            try utils.getSanitizedName(node.inputs.items[0].?.name),
+            ")",
+        });
+    }
+
+    //----create depth string
+    var depth_string: []u8 = undefined;
+    defer allocator.free(depth_string);
+    if (node.inputs.items[1].?.tag == globals.TensorTag.INITIALIZER) {
+        depth_string = try std.mem.concat(allocator, u8, &[_][]const u8{
+            "@constCast(&param_lib.tensor_",
+            try utils.getSanitizedName(node.inputs.items[1].?.name),
+            ")",
+        });
+    } else {
+        depth_string = try std.mem.concat(allocator, u8, &[_][]const u8{
+            "@constCast(&tensor_",
+            try utils.getSanitizedName(node.inputs.items[1].?.name),
+            ")",
+        });
+    }
+
+    //----create values string
+    var values_string: []u8 = undefined;
+    defer allocator.free(values_string);
+    if (node.inputs.items[2].?.tag == globals.TensorTag.INITIALIZER) {
+        values_string = try std.mem.concat(allocator, u8, &[_][]const u8{
+            "@constCast(&param_lib.tensor_",
+            try utils.getSanitizedName(node.inputs.items[2].?.name),
+            ")",
+        });
+    } else {
+        values_string = try std.mem.concat(allocator, u8, &[_][]const u8{
+            "@constCast(&tensor_",
+            try utils.getSanitizedName(node.inputs.items[2].?.name),
+            ")",
+        });
+    }
+
+    _ = try writer.print(
+        \\
+        \\
+        \\    tensMath.oneHot_lean(
+        \\        {s}, // T
+        \\        {s}, // indices
+        \\        {s}.data[0], // depth (scalar)
+        \\        {s}, // values
+        \\        {}, // axis
+        \\        &tensor_{s}, // output
+        \\    )
+    , .{
+        try utils.getTypeString(globals.tensorHashMap.getPtr(node.inputs.items[2].?.name).?.tensorProto.?.data_type), // T
+        indices_string, // indices
+        depth_string, // depth
+        values_string, // values
+        axis, // axis
+        try utils.getSanitizedName(node.outputs.items[0].name), // output
+    });
+}
+
 inline fn write_sub(writer: std.fs.File.Writer, node: *ReadyNode) !void {
     // https://onnx.ai/onnx/operators/onnx__Sub.html
     // INPUTS:
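
For reference, this is roughly the fragment write_oneHot emits into the generated model source for a hypothetical node named onehot0 whose three inputs are all initializers (the tensor names here are illustrative, and the surrounding generated function is assumed to wrap the call):

    tensMath.oneHot_lean(
        f32, // T
        @constCast(&param_lib.tensor_indices0), // indices
        @constCast(&param_lib.tensor_depth0).data[0], // depth (scalar)
        @constCast(&param_lib.tensor_values0), // values
        -1, // axis
        &tensor_onehot0, // output
    )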
@@ -2177,6 +2270,37 @@ inline fn write_transpose(writer: std.fs.File.Writer, node: *ReadyNode) !void {
     });
 }
 
+inline fn write_floor(writer: std.fs.File.Writer, node: *ReadyNode) !void {
+    // https://onnx.ai/onnx/operators/onnx__Floor.html
+    // INPUTS:
+    //      - X (heterogeneous) - T: Input tensor
+    // OUTPUTS:
+    //      - Y (heterogeneous) - T: Output tensor with the floor of the input elements
+    //        (if x is integral, +0, -0, NaN, or infinite, x itself is returned)
+
+    // Create input tensor string
+    var input_tensor_string: []u8 = undefined;
+    defer allocator.free(input_tensor_string);
+
+    if (node.inputs.items[0].?.tag == globals.TensorTag.INITIALIZER) {
+        input_tensor_string = try std.mem.concat(allocator, u8, &[_][]const u8{
+            "@constCast(&param_lib.tensor_",
+            try utils.getSanitizedName(node.inputs.items[0].?.name),
+            ")",
+        });
+    } else {
+        input_tensor_string = try std.mem.concat(allocator, u8, &[_][]const u8{ "&tensor_", try utils.getSanitizedName(node.inputs.items[0].?.name) });
+    }
+
+    _ = try writer.print(
+        \\
+        \\
+        \\    tensMath.floor_lean(T, {s}, &tensor_{s})
+    , .{
+        input_tensor_string,
+        try utils.getSanitizedName(node.outputs.items[0].name),
+    });
+}
+
 inline fn write_tanh(writer: std.fs.File.Writer, node: *ReadyNode) !void {
     // https://onnx.ai/onnx/operators/onnx__Tanh.html
    // INPUTS:
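
Similarly, for a hypothetical non-initializer input input0 and output floor0, write_floor emits a fragment along these lines (names illustrative; the type parameter T is assumed to be an alias defined by the surrounding generated code):

    tensMath.floor_lean(T, &tensor_input0, &tensor_floor0)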

src/CodeGen/shape_handler.zig

Lines changed: 110 additions & 2 deletions
@@ -80,6 +80,9 @@ pub fn compute_output_shape(readyNode: *ReadyNode) !void {
     } else if (std.mem.eql(u8, readyNode.nodeProto.op_type, "Flatten")) {
         //https://onnx.ai/onnx/operators/onnx__Flatten.html
         try compute_flatten_output_shape(readyNode);
+    } else if (std.mem.eql(u8, readyNode.nodeProto.op_type, "Floor")) {
+        //https://onnx.ai/onnx/operators/onnx__Floor.html
+        try compute_floor_output_shape(readyNode);
     } else if (std.mem.eql(u8, readyNode.nodeProto.op_type, "Gather")) {
         try compute_gather_output_shape(readyNode);
     } else if (std.mem.eql(u8, readyNode.nodeProto.op_type, "Gemm")) {
@@ -100,8 +103,8 @@ pub fn compute_output_shape(readyNode: *ReadyNode) !void {
         //https://onnx.ai/onnx/operators/onnx__Neg.html
         try compute_neg_output_shape(readyNode);
     } else if (std.mem.eql(u8, readyNode.nodeProto.op_type, "OneHot")) {
-        // TODO
-        return error.OperationWIP;
+        //https://onnx.ai/onnx/operators/onnx__OneHot.html
+        try compute_oneHot_output_shape(readyNode);
     } else if (std.mem.eql(u8, readyNode.nodeProto.op_type, "Pad")) {
         //https://onnx.ai/onnx/operators/onnx__Pad.html
         try compute_pads_output_shape(readyNode);
@@ -438,6 +441,93 @@ inline fn compute_gemm_output_shape(readyNode: *ReadyNode) !void {
     readyNode.outputs.items[0].shape = shape;
 }
 
+inline fn compute_oneHot_output_shape(readyNode: *ReadyNode) !void {
+    std.debug.print("\n====== compute_oneHot_output_shape node: {s} ======\n", .{readyNode.nodeProto.name orelse "(unnamed)"});
+
+    var shape: []const i64 = undefined;
+
+    if (utils.getTensorShape(readyNode.outputs.items[0].name)) |tensorShape| {
+        shape = tensorShape;
+    } else {
+        // Verify there are exactly 3 inputs: indices, depth, values
+        if (readyNode.inputs.items.len != 3) {
+            std.debug.print("\n ERROR: OneHot expects exactly 3 inputs, got {d}\n", .{readyNode.inputs.items.len});
+            return error.InvalidNumberOfInputs;
+        }
+
+        const indices = readyNode.inputs.items[0].?;
+        const depth_tensor = readyNode.inputs.items[1].?;
+        const values = readyNode.inputs.items[2].?;
+
+        std.debug.print("\n indices_shape: []i64 = {any}", .{indices.shape});
+        std.debug.print("\n depth_shape: []i64 = {any}", .{depth_tensor.shape});
+        std.debug.print("\n values_shape: []i64 = {any}", .{values.shape});
+
+        // Verify that depth is a scalar (shape [] or [1])
+        const depth_shape_i64 = depth_tensor.shape;
+        const effective_depth_shape_i64 = if (depth_shape_i64.len == 0) &[_]i64{1} else depth_shape_i64;
+        if (effective_depth_shape_i64.len > 1 or effective_depth_shape_i64[0] != 1) {
+            std.debug.print("\n ERROR: depth must be a scalar, got shape {any}\n", .{effective_depth_shape_i64});
+            return error.InvalidDepthShape;
+        }
+
+        // Verify that values has shape [2]
+        const values_shape_i64 = values.shape;
+        const effective_values_shape_i64 = if (values_shape_i64.len == 0) &[_]i64{1} else values_shape_i64;
+        if (effective_values_shape_i64.len != 1 or effective_values_shape_i64[0] != 2) {
+            std.debug.print("\n ERROR: values must have shape [2], got shape {any}\n", .{effective_values_shape_i64});
+            return error.InvalidValuesShape;
+        }
+
+        // Extract the depth value
+        var depth: i64 = undefined;
+        if (depth_tensor.tensorProto != null and depth_tensor.tensorProto.?.int64_data != null) {
+            depth = depth_tensor.tensorProto.?.int64_data.?[0];
+        } else if (depth_tensor.tensorProto != null and depth_tensor.tensorProto.?.raw_data != null) {
+            const raw = depth_tensor.tensorProto.?.raw_data.?;
+            if (raw.len < @sizeOf(i64)) {
+                std.debug.print("\n ERROR: depth raw_data is too small to contain an i64\n", .{});
+                return error.InvalidDepthData;
+            }
+            depth = std.mem.readInt(i64, raw[0..@sizeOf(i64)], .little);
+        } else {
+            std.debug.print("\n ERROR: depth tensorProto is missing valid data\n", .{});
+            return error.DepthDataMissing;
+        }
+
+        // Verify that depth is positive
+        if (depth <= 0) {
+            std.debug.print("\n ERROR: depth must be positive, got {d}\n", .{depth});
+            return error.InvalidDepthValue;
+        }
+
+        // Extract the axis attribute (default: -1)
+        var axis: i64 = -1;
+        for (readyNode.nodeProto.attribute) |attr| {
+            if (std.mem.eql(u8, attr.name, "axis")) {
+                if (attr.type != AttributeType.INT) {
+                    std.debug.print("\n ERROR: axis attribute must be INT, got type {any}\n", .{attr.type});
+                    return error.InvalidAttributeType;
+                }
+                axis = attr.i;
+                break;
+            }
+        }
+
+        const indices_shape_i64 = indices.shape;
+        const indices_shape_usize = try utils.i64SliceToUsizeSlice(indices_shape_i64);
+        defer allocator.free(indices_shape_usize);
+
+        const output_shape_usize = try tensorMath.get_oneHot_output_shape(indices_shape_usize, depth, axis);
+        defer allocator.free(output_shape_usize);
+
+        shape = try utils.usizeSliceToI64Slice(output_shape_usize);
+    }
+
+    readyNode.outputs.items[0].shape = shape;
+    std.debug.print("\n output_shape: []i64 = {any}", .{readyNode.outputs.items[0].shape});
+}
+
 inline fn compute_mul_output_shape(readyNode: *ReadyNode) !void {
     Codegen_log.info("\n====== compute_mul_output_shape node: {s} ======\n", .{readyNode.nodeProto.name.?});
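
The shape rule itself is delegated to tensorMath.get_oneHot_output_shape, which is not part of this diff. A minimal sketch of the rule it is assumed to implement, per the ONNX spec (function name and error value here are illustrative): insert depth into the indices shape at the normalized axis.

    // Example: indices [2, 3], depth 10 -> axis -1 gives [2, 3, 10]; axis 0 gives [10, 2, 3].
    fn oneHotShapeSketch(alloc: std.mem.Allocator, indices_shape: []const usize, depth: i64, axis: i64) ![]usize {
        const rank: i64 = @intCast(indices_shape.len);
        // ONNX allows axis in [-rank-1, rank]; negative values wrap around.
        var norm_axis = axis;
        if (norm_axis < 0) norm_axis += rank + 1;
        if (norm_axis < 0 or norm_axis > rank) return error.InvalidAxis;
        const ax: usize = @intCast(norm_axis);

        // Output rank is rank+1: copy the indices shape and splice depth in at `ax`.
        const out = try alloc.alloc(usize, indices_shape.len + 1);
        @memcpy(out[0..ax], indices_shape[0..ax]);
        out[ax] = @intCast(depth);
        @memcpy(out[ax + 1 ..], indices_shape[ax..]);
        return out;
    }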

@@ -1028,6 +1118,24 @@ inline fn compute_tanh_output_shape(readyNode: *ReadyNode) !void {
     readyNode.outputs.items[0].shape = shape;
 }
 
+inline fn compute_floor_output_shape(readyNode: *ReadyNode) !void {
+    const input = readyNode.inputs.items[0] orelse {
+        return error.InputTensorIsNull;
+    };
+
+    var shape: []const i64 = undefined;
+
+    if (utils.getTensorShape(readyNode.outputs.items[0].name)) |tensorShape| {
+        shape = tensorShape;
+    } else {
+        const input_shape = input.shape;
+        std.debug.print("\n input_shape: []i64 = {any}", .{input_shape});
+
+        shape = try utils.usizeSliceToI64Slice(try tensorMath.get_floor_output_shape(try utils.i64SliceToUsizeSlice(input_shape)));
+    }
+    readyNode.outputs.items[0].shape = shape;
+}
+
 inline fn compute_elu_output_shape(readyNode: *ReadyNode) !void {
     const input = readyNode.inputs.items[0] orelse {
         return error.InputTensorIsNull;
Lines changed: 40 additions & 0 deletions
@@ -0,0 +1,40 @@
+const std = @import("std");
+const zant = @import("../../../../zant.zig");
+const pkg_allocator = zant.utils.allocator.allocator;
+
+const Tensor = zant.core.tensor.Tensor; // Import Tensor type
+
+pub fn get_floor_output_shape(input_shape: []const usize) ![]usize {
+    // Allocate and copy the input shape; Floor is element-wise, so the shape is unchanged
+    const output_shape = try pkg_allocator.alloc(usize, input_shape.len);
+    errdefer pkg_allocator.free(output_shape);
+
+    std.mem.copyForwards(usize, output_shape, input_shape);
+
+    return output_shape;
+}
+
+pub fn floor(comptime T: anytype, input: *Tensor(T)) !Tensor(T) {
+    comptime if (!(std.meta.eql(T, f64) or std.meta.eql(T, f32) or std.meta.eql(T, f16))) {
+        @compileError("Unsupported type in floor");
+    };
+
+    const output_shape = try get_floor_output_shape(input.shape);
+    var output = try Tensor(T).fromShape(&pkg_allocator, output_shape);
+    defer pkg_allocator.free(output_shape);
+    errdefer output.deinit();
+
+    try floor_lean(T, input, &output);
+    return output;
+}
+
+pub fn floor_lean(comptime T: anytype, input: *Tensor(T), output: *Tensor(T)) !void {
+    // Compute floor(x) for each element of the tensor; per the ONNX spec,
+    // +0, -0, NaN, infinities, and already-integral values pass through unchanged
+    for (input.data, output.data) |in_val, *out_val| {
+        if (std.math.isNan(in_val) or std.math.isInf(in_val) or in_val == 0 or in_val == @trunc(in_val)) {
+            out_val.* = in_val;
+        } else {
+            out_val.* = std.math.floor(in_val);
+        }
+    }
+}
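
A minimal usage sketch for the new op. The module alias floor_ops stands in for wherever this file is exposed (its path is not shown in this view), and the values are illustrative; Tensor(T).fromShape, .data, and .deinit are used exactly as in the diff above:

    const std = @import("std");
    const zant = @import("zant"); // assumed: module name for the library root
    const Tensor = zant.core.tensor.Tensor;
    const pkg_allocator = zant.utils.allocator.allocator;
    const floor_ops = zant.core.tensor.math_standard; // assumed namespace for floor()

    test "floor rounds each element down" {
        var shape = [_]usize{4};
        var input = try Tensor(f32).fromShape(&pkg_allocator, &shape);
        defer input.deinit();

        // Values that exercise both the plain and the pass-through cases.
        @memcpy(input.data, &[_]f32{ 1.7, -1.2, 3.0, -0.0 });

        var output = try floor_ops.floor(f32, &input);
        defer output.deinit();

        try std.testing.expectEqualSlices(f32, &[_]f32{ 1.0, -2.0, 3.0, -0.0 }, output.data);
    }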
