Add Llama example showcasing the new func.call emission and function caching behavior.

2023-10-17 11:00:37 +00:00 · 2023-10-17 11:00:37 +00:00 · 37de7b9613
commit 37de7b9613
parent 7d36913b31
2 changed files with 4 additions and 8 deletions
--- a/examples/llama/llama.zig
+++ b/examples/llama/llama.zig
@@ -180,10 +180,8 @@ pub const Llama = struct {
        var updated_kv_cache = kv_cache0;
        for (self.layers, 0..) |layer, i| {
            hidden, updated_kv_cache = zml.call(layer, .forward, .{ hidden, token_index, updated_kv_cache.atLayer(i) });
            hidden = hidden.withPartialTags(.{ .s, .d });
        }
-        // TODO: tags seem to be lost by `callFunc`.
+        const output = zml.call(self.norm, .forward, .{hidden});
        const output = zml.call(self.norm, .forward, .{hidden.withPartialTags(.{ .s, .d })});
        return .{ output, updated_kv_cache.reuseBuffer(kv_cache0) };
    }
--- a/examples/llama/main.zig
+++ b/examples/llama/main.zig
@@ -21,12 +21,10 @@ const log = std.log.scoped(.llama);
 const show_mlir = true;
 pub const std_options = .{
-    .log_level = .err,
+    .log_level = .warn,
    .log_scope_levels = &[_]std.log.ScopeLevel{
-        .{ .scope = .pjrt, .level = if (show_mlir) .debug else .err },
+        .{ .scope = .zml_module, .level = if (show_mlir) .debug else .warn },
-        .{ .scope = .zml_module, .level = if (show_mlir) .debug else .err },
+        .{ .scope = .llama, .level = .info },
        .{ .scope = .zml, .level = if (show_mlir) .debug else .err },
        .{ .scope = .llama, .level = if (show_mlir) .debug else .info },
    },
 };