File tree Expand file tree Collapse file tree 2 files changed +3
-4
lines changed
kubeflow/training/constants Expand file tree Collapse file tree 2 files changed +3
-4
lines changed Original file line number Diff line number Diff line change 153
153
JAXJOB_PLURAL = "jaxjobs"
154
154
JAXJOB_CONTAINER = "jax"
155
155
JAXJOB_REPLICA_TYPES = REPLICA_TYPE_WORKER .lower ()
156
- JAXJOB_BASE_IMAGE = "docker.io/kubeflow/jaxjob-simple :latest"
156
+ JAXJOB_BASE_IMAGE = "docker.io/kubeflow/jaxjob-dist-spmd-mnist :latest"
157
157
158
158
# Dictionary to get plural, model, and container for each Job kind.
159
159
JOB_PARAMETERS = {
Original file line number Diff line number Diff line change @@ -155,7 +155,6 @@ def generate_jaxjob(
155
155
def generate_container () -> V1Container :
156
156
return V1Container (
157
157
name = CONTAINER_NAME ,
158
- image = "docker.io/kubeflow/jaxjob-simple:latest" ,
159
- command = ["python" , "train.py" ],
160
- resources = V1ResourceRequirements (limits = {"memory" : "2Gi" , "cpu" : "0.8" }),
158
+ image = os .getenv ("JAX_JOB_IMAGE" , "docker.io/kubeflow/jaxjob-dist-spmd-mnist:latest" ),
159
+ resources = V1ResourceRequirements (limits = {"memory" : "3Gi" , "cpu" : "1.2" }),
161
160
)
You can’t perform that action at this time.
0 commit comments