|
//! Multi-dimensional Array and auto-differentiable Tensor types for the kiwigrad autograd engine
| 2 | + |
| 3 | +const std = @import("std"); |
| 4 | +const engine = @import("engine.zig"); |
| 5 | + |
/// Represents a multi-dimensional array of element type `T`.
/// All instances created via `new` are allocated from a shared arena;
/// call `init` before `new` and `deinit` to release everything at once.
pub fn Array(comptime T: type) type {
    return struct {
        const Self = @This();

        /// The element buffer, addressed through `stride`.
        data: []T,
        /// The length of each dimension.
        shape: []usize,
        /// Elements to step per dimension when computing a flat index.
        stride: []usize,
        /// The number of dimensions (rank) of the array.
        dims: usize,
        /// The total number of elements in the array.
        size: usize,

        /// Backing arena for all Array(T) structs created via `new`.
        var arena: std.heap.ArenaAllocator = undefined;

        /// Initialize the arena allocator; must be called before `new`.
        pub fn init(alloc: std.mem.Allocator) void {
            arena = std.heap.ArenaAllocator.init(alloc);
        }

        /// Cleanup all memory allocated through the arena.
        pub fn deinit() void {
            arena.deinit();
        }

        /// Create a new Array. Only the struct itself is arena-allocated;
        /// the caller retains ownership of the `data`, `shape` and
        /// `stride` slices, which must outlive the returned Array.
        pub fn new(data: []T, shape: []usize, stride: []usize, dims: usize, size: usize) *Self {
            const a = arena.allocator().create(Self) catch unreachable;
            a.* = Self{
                .data = data,
                .shape = shape,
                .stride = stride,
                .dims = dims,
                .size = size,
            };
            return a;
        }

        /// Return a pointer to the element at the given coordinates.
        pub inline fn at(self: *Self, coords: []const usize) *T {
            // Fix: the signature promises *T, so take the address of the
            // slot; the original returned the value and did not compile.
            return &self.data[self.index(coords)];
        }

        /// Compute the flat index of the element at the given coordinates.
        /// Panics when `coords.len` does not match the array's rank.
        pub inline fn index(self: *Self, coords: []const usize) usize {
            if (coords.len != self.dims) {
                std.debug.panic("Input size mismatch: {d} != {d}", .{ coords.len, self.dims });
            }

            // Fix: annotate as usize — an untyped `var idx = 0` infers
            // comptime_int, which cannot accumulate runtime values.
            var idx: usize = 0;
            for (coords, 0..) |coord, i| {
                idx += coord * self.stride[i];
            }
            return idx;
        }

        /// Set the element at the given coordinates to `value`.
        pub inline fn set(self: *Self, coords: []const usize, value: T) void {
            self.data[self.index(coords)] = value;
        }
    };
}
| 70 | + |
/// Represents an auto-differentiable Tensor value over numeric type `T`.
/// All tensors are allocated from a shared arena; call `init` before
/// `new` and `deinit` to release everything at once.
pub fn Tensor(comptime T: type) type {
    // Reject non-numeric element types before doing any other work.
    switch (@typeInfo(T)) {
        .int, .comptime_int, .float, .comptime_float => {},
        else => @compileError("Expected @int or @float type, got: " ++ @typeName(T)),
    }

    const ArrayType = Array(T);

    return struct {
        const Self = @This();
        /// Signature of the function that propagates gradients to children.
        const BackpropFn = *const fn (self: *Self) void;

        /// Describes how a Tensor value was produced.
        const Expr = union(engine.ExprType) {
            /// Leaf tensor: not the result of any operation.
            nop: void,
            unary: struct {
                /// The unary operation that produced the value
                op: engine.UnaryType,
                backprop_fn: BackpropFn,
                /// The children used to compute the value
                prev: [1]*Self,
            },
            binary: struct {
                /// The binary operation that produced the value
                op: engine.BinaryType,
                backprop_fn: BackpropFn,
                /// The children used to compute the value
                prev: [2]*Self,
            },
        };

        /// The data
        data: []ArrayType,
        /// The gradient, same shape as `data`
        grad: []ArrayType,
        /// The expression that produced the value
        expr: Expr,

        /// The arena allocator backing all Tensor allocations.
        var arena: std.heap.ArenaAllocator = undefined;

        /// Initialize the arena allocator; must be called before `new`.
        pub fn init(alloc: std.mem.Allocator) void {
            arena = std.heap.ArenaAllocator.init(alloc);
        }

        /// Deinitialize the arena allocator, freeing all tensors at once.
        pub fn deinit() void {
            arena.deinit();
        }

        /// Allocate a fresh 1-D ArrayType of `len` elements from this
        /// tensor's own arena. The element buffer is left uninitialized;
        /// the caller must fill it before use.
        ///
        /// Built directly (rather than via `ArrayType.new`) so Tensor
        /// does not depend on `Array(T).init` having been called and
        /// does not leak an intermediate struct in Array's arena.
        fn alloc1d(len: usize) ArrayType {
            const a = arena.allocator();
            const buf = a.alloc(T, len) catch unreachable;
            const shape = a.alloc(usize, 1) catch unreachable;
            const stride = a.alloc(usize, 1) catch unreachable;
            shape[0] = len;
            stride[0] = 1;
            return ArrayType{
                .data = buf,
                .shape = shape,
                .stride = stride,
                .dims = 1,
                .size = len,
            };
        }

        /// Create a new leaf (1-D) Tensor value from array data.
        /// The input is copied; the Tensor owns its own storage.
        pub fn new(data: []const T) *Self {
            const t = arena.allocator().create(Self) catch unreachable;

            // Data array: a private copy of the input values.
            const data_arrays = arena.allocator().alloc(ArrayType, 1) catch unreachable;
            data_arrays[0] = alloc1d(data.len);
            @memcpy(data_arrays[0].data, data);

            // Gradient array: same shape, zero-initialized.
            const grad_arrays = arena.allocator().alloc(ArrayType, 1) catch unreachable;
            grad_arrays[0] = alloc1d(data.len);
            @memset(grad_arrays[0].data, 0);

            t.* = Self{ .data = data_arrays, .grad = grad_arrays, .expr = .{ .nop = {} } };

            return t;
        }

        // TODO: arithmetic ops (add, mul, ...) wiring up backprop_fn.
        // /// Add two Tensors
        // pub inline fn add(self: *Self, other: *Self) *Self {
        //     return binary(self.data + other.data, .add, add_back, self, other);
        // }
    };
}
0 commit comments