Skip to content

Commit

Permalink
Generate llama instead of downloading it
Browse files · Browse the repository at this point in the history
  • Loading branch information
satyaog committed Sep 3, 2024
1 parent 544e44a commit 7b4863e
Show file tree
Hide file tree
Showing 11 changed files with 1,129 additions and 6 deletions.
24 changes: 24 additions & 0 deletions benchmarks/llm/benchfile.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,5 @@
import tempfile
from milabench.fs import XPath
from milabench.pack import Package


Expand Down Expand Up @@ -38,6 +40,28 @@ class Llm(Package):
# Entry-point script for the benchmark's prepare phase — presumably invoked
# by the milabench pack lifecycle before the run; verify against Package docs.
prepare_script = "prepare.py"

async def install(self):
    """Install the benchmark, vendoring the pieces of llama3 it needs.

    Clones meta-llama/llama3 at a pinned commit into a throwaway
    directory, merges only the ``llama/`` package and its
    ``requirements.txt`` into the local ``llama3`` directory next to
    this file, strips the pinned ``tiktoken`` requirement, and finally
    delegates to the parent install (which installs the requirements).
    """
    vendored_dir = XPath(__file__).resolve().parent / "llama3"

    with tempfile.TemporaryDirectory() as scratch:
        scratch = XPath(scratch)
        # Pinned checkout so the vendored sources are reproducible.
        scratch.clone_subtree(
            "https://github.com/meta-llama/llama3.git",
            "11817d47e1ba7a4959b025eb1ca308572e0e3963",
        )
        # Only copy what the benchmark actually consumes.
        scratch.merge_into(
            vendored_dir,
            manifest="\n".join(
                [
                    "/llama/",
                    "/requirements.txt",
                ]
            )
        )

    # Fix conflict with tiktoken. As we only need llama/model.py, we don't
    # need to care about a compatible tiktoken for the llama3 module
    req_file = vendored_dir / "requirements.txt"
    kept_lines = [
        line
        for line in req_file.read_text().splitlines()
        if not line.startswith("tiktoken==")
    ]
    req_file.write_text("\n".join(kept_lines))

    await super().install()  # super() call installs the requirements

def build_run_plan(self):
Expand Down
6 changes: 6 additions & 0 deletions benchmarks/llm/llama3/llama/__init__.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,6 @@
# Copyright (c) Meta Platforms, Inc. and affiliates.
# This software may be used and distributed in accordance with the terms of the Llama 3 Community License Agreement.

from .generation import Llama
from .model import ModelArgs, Transformer
from .tokenizer import Dialog, Tokenizer
Loading

0 comments on commit 7b4863e

Please sign in to comment.