Add support for the Llama 3.1 70B Instruct model to facilitate testing on high-performance accelerators.
This commit is contained in:
parent
fdb7da5c9b
commit
837f8fb111
@ -102,6 +102,30 @@ filegroup(
|
||||
)
|
||||
use_repo(huggingface, "Meta-Llama-3.1-8B-Instruct")

# Llama 3.1 70B Instruct. The 70B checkpoint is sharded, so the generated
# "model" filegroup bundles every *.safetensors shard together with the
# index file that maps tensor names to shards.
huggingface.model(
    name = "Meta-Llama-3.1-70B-Instruct",
    model = "meta-llama/Meta-Llama-3.1-70B-Instruct",
    # Pinned revision of the Hugging Face repository.
    commit = "945c8663693130f8be2ee66210e062158b2a9693",
    # Only fetch the files the build actually consumes.
    includes = [
        "*.safetensors",
        "model.safetensors.index.json",
        "tokenizer.json",
    ],
    build_file_content = """\
package(default_visibility = ["//visibility:public"])
filegroup(
    name = "model",
    srcs = glob(["*.safetensors"]) + ["model.safetensors.index.json"],
)

filegroup(
    name = "tokenizer",
    srcs = ["tokenizer.json"],
)
""",
)

use_repo(huggingface, "Meta-Llama-3.1-70B-Instruct")

huggingface.model(
|
||||
name = "TinyLlama-1.1B-Chat-v1.0",
|
||||
build_file_content = """\
|
||||
|
||||
@ -34,6 +34,23 @@ native_binary(
|
||||
],
|
||||
)
|
||||
|
||||
# Runner for Llama 3.1 70B Instruct on top of the shared :llama binary.
# The model is pointed at the safetensors index (the shards themselves are
# pulled in via the "model" filegroup in data so $(location ...) resolves
# and the files are staged at run time).
native_binary(
    name = "Llama-3.1-70B-Instruct",
    src = ":llama",
    args = [
        "--model=$(location @Meta-Llama-3.1-70B-Instruct//:model.safetensors.index.json)",
        "--tokenizer=$(location @Meta-Llama-3.1-70B-Instruct//:tokenizer)",
        # Attention layout and RoPE base for the 70B configuration.
        "--num-heads=64",
        "--num-kv-heads=8",
        "--rope-freq-base=500000",
    ],
    data = [
        "@Meta-Llama-3.1-70B-Instruct//:model",
        "@Meta-Llama-3.1-70B-Instruct//:model.safetensors.index.json",
        "@Meta-Llama-3.1-70B-Instruct//:tokenizer",
    ],
)

native_binary(
|
||||
name = "OpenLLaMA-3B",
|
||||
src = ":llama",
|
||||
|
||||
Loading…
Reference in New Issue
Block a user