Skip to content

Commit 51e9034

Browse files
committed
update and pin modal images
1 parent a2b4cdc commit 51e9034

2 files changed

Lines changed: 32 additions & 25 deletions

File tree

src/discord-cluster-manager/modal_runner.py

Lines changed: 31 additions & 24 deletions
Original file line numberDiff line numberDiff line change
@@ -8,41 +8,48 @@
88
# Create a stub for the Modal app
99
# IMPORTANT: This has to stay in a separate file or modal breaks
1010
app = App("discord-bot-runner")
11-
cuda_version = "12.4.0"
11+
cuda_version = "12.8.0"
1212
flavor = "devel"
13-
operating_sys = "ubuntu22.04"
13+
operating_sys = "ubuntu24.04"
1414
tag = f"{cuda_version}-{flavor}-{operating_sys}"
1515

1616
# Move this to another file later:
1717
cuda_image = (
18-
Image.from_registry(f"nvidia/cuda:{tag}", add_python="3.11")
18+
Image.from_registry(f"nvidia/cuda:{tag}", add_python="3.12")
1919
.apt_install(
2020
"git",
21-
"gcc-11",
22-
"g++-11",
23-
"clang-11", # note i skip a step
21+
"gcc-13",
22+
"g++-13",
23+
"clang-18",
2424
)
2525
.pip_install(
26-
"ninja",
27-
"packaging",
28-
"wheel",
29-
"torch",
30-
"numpy",
31-
"triton",
32-
"jax[cuda12]",
33-
"jax2torch",
34-
"tinygrad",
26+
"ninja~=1.11",
27+
"wheel~=0.45",
28+
"requests~=2.32.4",
29+
"packaging~=25.0",
30+
"numpy~=2.3",
3531
)
36-
.run_commands(
37-
"update-alternatives --install /usr/bin/gcc gcc /usr/bin/gcc-11 100 "
38-
+ "--slave /usr/bin/g++ g++ /usr/bin/g++-11",
39-
# "apt update",
40-
# "apt -y install clang-10", # this should be clang-10 but I can't get it to work yet
41-
#
42-
"git clone https://github.com/HazyResearch/ThunderKittens.git",
43-
# "cd /ThunderKittens && pwd && python setup.py install",
32+
.pip_install(
33+
"torch~=2.7",
34+
"torchvision~=0.22",
35+
"torchaudio~=2.7",
36+
index_url="https://download.pytorch.org/whl/cu128"
37+
)
38+
# other frameworks
39+
.pip_install(
40+
"jax[cuda12]==0.5.3", # 0.6 wants cudnn 9.8, which conflicts with torch 2.7
41+
"jax2torch==0.0.7",
42+
"tinygrad~=0.10",
43+
)
44+
# nvidia cuda packages
45+
.pip_install(
46+
"nvidia-cupynumeric~=25.3",
47+
"nvidia-cutlass-dsl~=4.0",
48+
"cuda-core[cu12]~=0.3",
49+
"cuda-python[all]==12.8",
50+
#"nvmath-python[cu12]~=0.4",
51+
#"numba-cuda[cu12]~=0.15",
4452
)
45-
.pip_install("requests")
4653
)
4754

4855
cuda_image = cuda_image.add_local_python_source(

src/discord-cluster-manager/modal_runner_archs.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -2,7 +2,7 @@
22
# Modal apps on specific devices. We will fix this later.
33
from modal_runner import app, cuda_image, modal_run_config
44

5-
gpus = ["T4", "L4", "A100-80GB", "H100!"]
5+
gpus = ["T4", "L4", "A100-80GB", "H100!", "B200"]
66
for gpu in gpus:
77
gpu_slug = gpu.lower().split("-")[0].strip("!")
88
app.function(gpu=gpu, image=cuda_image, name=f"run_cuda_script_{gpu_slug}", serialized=True)(

0 commit comments

Comments
 (0)