diff --git a/.gitmodules b/.gitmodules index e837ed9a..fc9806ff 100644 --- a/.gitmodules +++ b/.gitmodules @@ -1,4 +1,4 @@ [submodule "ThunderKittens"] path = ThunderKittens - url = https://github.com/HazyResearch/ThunderKittens.git + url = https://github.com/HaoZhang-Ethan/ThunderKittens.git branch = bvm-single-ctrl-pre-new-warps diff --git a/ThunderKittens b/ThunderKittens index 664c108d..7bd4b5c8 160000 --- a/ThunderKittens +++ b/ThunderKittens @@ -1 +1 @@ -Subproject commit 664c108d16f12707a73d3072ab525f26fb2b4f62 +Subproject commit 7bd4b5c889803c8cbc33fc4dc8223f5c74fc78eb diff --git a/megakernels/scripts/generate.py b/megakernels/scripts/generate.py index 2b43f943..f31b518b 100644 --- a/megakernels/scripts/generate.py +++ b/megakernels/scripts/generate.py @@ -26,7 +26,8 @@ class ScriptConfig(pydra.Config): - model: str = "meta-llama/Llama-3.2-1B-Instruct" + # model: str = "meta-llama/Llama-3.2-1B-Instruct" + model: str = "/home/fit/qianxueh/WORK/alchem/zhanghao/Mega/Models/Meta-Llama-3.2-1B-Instruct" device: str = "cuda:0" prompt: str = "tell me a funny joke about cookies" chat: bool = False