44export NAME=axlearn-img
55export COLOCATED_NAME=colocated-img
66export CKPT_BUCKET_NAME=<>
7+ export CLUSTER_NAME=<>
78
89axlearn gcp bundle --name=$NAME \
910 --bundler_spec=allow_dirty=True \
@@ -17,7 +18,7 @@ axlearn gcp bundle --name=$NAME \
1718
1819
1920
20- axlearn gcp launch run --cluster=mlperf-v5p \
21+ axlearn gcp launch run --cluster=$CLUSTER_NAME \
2122 --runner_name gke_tpu_pathways \
2223 --name=$NAME \
2324 --instance_type=tpu-v5p-32 \
@@ -29,3 +30,41 @@ axlearn gcp launch run --cluster=mlperf-v5p \
2930 --bundler_spec=target=tpu \
3031 --colocated_image=$COLOCATED_NAME \
3132 -- TPU_PREMAPPED_BUFFER_SIZE=34359738368 python3 test_benchmark.py --ckpt_path $CKPT_BUCKET_NAME
33+
34+
35+ #### Alternative: build the two images separately, then launch ####
36+
37+ export NAME=lk-axlearnimg13
38+ export COLOCATED_NAME=colocated-image23
39+ export CKPT_BUCKET_NAME=<>
40+ export CLUSTER_NAME=<>
41+
42+ ### Bundle the colocated image ###
43+ axlearn gcp bundle --name=$COLOCATED_NAME \
44+ --bundler_spec=allow_dirty=True \
45+ --bundler_type=artifactregistry \
46+ --bundler_spec=dockerfile=Dockerfile \
47+ --bundler_spec=image=$COLOCATED_NAME \
48+ --bundler_spec=target=colocated-python
49+
50+ ### Bundle the axlearn image ###
51+ axlearn gcp bundle --name=$NAME \
52+ --bundler_spec=allow_dirty=True \
53+ --bundler_type=artifactregistry \
54+ --bundler_spec=dockerfile=Dockerfile \
55+ --bundler_spec=image=tpu \
56+ --bundler_spec=target=tpu
57+
58+ axlearn gcp launch run --cluster=$CLUSTER_NAME \
59+ --runner_name gke_tpu_pathways \
60+ --name=$NAME \
61+ --instance_type=tpu-v5p-32 \
62+ --num_replicas=1 \
63+ --bundler_spec=allow_dirty=True \
64+ --bundler_type=artifactregistry \
65+ --bundler_spec=image=tpu \
66+ --bundler_spec=dockerfile=Dockerfile \
67+ --bundler_spec=target=tpu \
68+ --colocated_image=$COLOCATED_NAME \
69+ -- TPU_PREMAPPED_BUFFER_SIZE=34359738368 python3 test_benchmark.py --ckpt_path $CKPT_BUCKET_NAME
70+
0 commit comments