2023-01-03 10:21:07 +00:00
|
|
|
const std = @import("std");

// NOTE: `async` is a reserved keyword in Zig and cannot be used as an
// identifier, so the async runtime module is bound under a legal name
// (this matches the upstream convention of calling it `asynk`).
const asynk = @import("async");

const zml = @import("zml");
|
2023-01-03 10:21:07 +00:00
|
|
|
|
|
|
|
|
/// Model definition: a single linear layer computing `weight * x (+ bias)`.
/// The bias term is optional; when absent, only the product is returned.
const Layer = struct {
    bias: ?zml.Tensor = null,

    weight: zml.Tensor,

    /// Multiplies the input by `weight` (element-wise per the demo's 4-element
    /// vectors) and adds `bias` when one is present.
    pub fn forward(self: Layer, x: zml.Tensor) zml.Tensor {
        const scaled = self.weight.mul(x);
        return if (self.bias) |b| scaled.add(b) else scaled;
    }
};
|
|
|
|
|
|
|
|
|
|
/// Process entry point: hands control to `asyncMain` on the async runtime's
/// main thread. Uses the C allocator because the runtime outlives any local
/// allocator scope set up inside `asyncMain`.
pub fn main() !void {
    // `async` is a reserved Zig keyword, so the runtime module is imported
    // locally under a legal identifier rather than through a top-level
    // binding named `async` (which would not compile).
    const async_runtime = @import("async");
    try async_runtime.AsyncThread.main(std.heap.c_allocator, asyncMain);
}
|
|
|
|
|
|
|
|
|
|
/// Demo body, run on the async runtime: builds a tiny `Layer` model by hand,
/// compiles it, uploads weights and an input, executes it, and prints the
/// result fetched back to host memory.
pub fn asyncMain() !void {
    // `async` is a reserved Zig keyword; import the runtime locally under a
    // legal identifier. Its API spells the helpers `asyncc`/`awaitt` for the
    // same reason — the plain spellings are keywords and would not parse.
    const async_runtime = @import("async");

    // Short lived allocations
    var gpa = std.heap.GeneralPurposeAllocator(.{}){};
    defer _ = gpa.deinit();
    const allocator = gpa.allocator();

    // Arena allocator for BufferStore etc. — freed all at once at scope exit.
    var arena_state = std.heap.ArenaAllocator.init(allocator);
    defer arena_state.deinit();
    const arena = arena_state.allocator();

    var context = try zml.Context.init();
    defer context.deinit();

    const platform = context.autoPlatform(.{});
    context.printAvailablePlatforms(platform);

    // Our weights and bias to use
    var weights = [4]f32{ 2.0, 2.0, 2.0, 2.0 };
    var bias = [4]f32{ 1.0, 2.0, 3.0, 4.0 };
    const input_shape = zml.Shape.init(.{4}, .f32);

    // We manually produce a BufferStore. You would not normally do that.
    // A BufferStore is usually created by loading model data from a file.
    var store: zml.aio.BufferStore = .init(allocator);
    defer store.deinit();
    try store.buffers.put(store.arena.allocator(), "weight", zml.HostBuffer.fromArrayPtr(&weights));
    try store.buffers.put(store.arena.allocator(), "bias", zml.HostBuffer.fromArrayPtr(&bias));

    // A clone of our model, consisting of shapes. We only need shapes for compiling.
    // We use the BufferStore to infer the shapes.
    var model_shapes = try zml.aio.populateModel(Layer, allocator, store);
    model_shapes.weight = model_shapes.weight.withSharding(.{-1});
    model_shapes.bias = model_shapes.bias.?.withSharding(.{-1});

    // Start compiling. This uses the inferred shapes from the BufferStore.
    // The shape of the input tensor, we have to pass in manually.
    // NOTE(review): `asyncc` is the runtime's spawn helper (plain `async` is a
    // keyword) — confirm against the async module's API.
    var compilation = try async_runtime.asyncc(zml.compileModel, .{ allocator, Layer.forward, model_shapes, .{input_shape}, platform });

    // Produce a bufferized weights struct from the fake BufferStore.
    // This is like the inferred shapes, but with actual values.
    // We will need to send those to the computation device later.
    var model_weights = try zml.aio.loadModelBuffers(Layer, model_shapes, store, arena, platform);
    defer zml.aio.unloadBuffers(&model_weights); // for good practice

    // Wait for compilation to finish (`awaitt`: plain `await` is a keyword).
    const compiled = try compilation.awaitt();

    // pass the model weights to the compiled module to create an executable module
    var executable = compiled.prepare(model_weights);
    defer executable.deinit();

    // prepare an input buffer
    // Here, we use zml.HostBuffer.fromSlice to show how you would create a HostBuffer
    // with a specific shape from an array.
    // For situations where e.g. you have an [4]f32 array but need a .{2, 2} input shape.
    var input = [4]f32{ 5.0, 5.0, 5.0, 5.0 };
    var input_buffer = try zml.Buffer.from(platform, zml.HostBuffer.fromSlice(input_shape, &input), .{});
    defer input_buffer.deinit();

    // call our executable module
    var result: zml.Buffer = executable.call(.{input_buffer});
    defer result.deinit();

    // fetch the result to CPU memory (arena-owned; freed with the arena)
    const cpu_result = try result.toHostAlloc(arena);
    std.debug.print(
        "\nThe result of {any} * {any} + {any} = {any}\n",
        .{ &weights, &input, &bias, cpu_result.items(f32) },
    );
}
|