# Define the custom training job: the local script is run inside the training
# container, and the serving image is recorded for the model it produces.
job = aiplatform.CustomTrainingJob(
    display_name=JOB_NAME,
    # Local training script submitted with the job; replace with the actual
    # path if the script lives elsewhere.
    script_path="task.py",
    # Image the training script runs in.
    # NOTE(review): this is a TF 2.2 image -- confirm it is still available
    # and compatible with the pinned tensorflow_datasets release below.
    container_uri="gcr.io/cloud-aiplatform/training/tf-cpu.2-2:latest",
    # Extra pip packages requested on top of the training image.
    requirements=["tensorflow_datasets==4.6.0"],
    # Image used to serve predictions from the trained model.
    # NOTE(review): presumably should match the TensorFlow version used for
    # training -- confirm.
    model_serving_container_image_uri=(
        "us-docker.pkg.dev/vertex-ai/prediction/tf2-cpu.2-2:latest"
    ),
)
# Display name for the resulting model: fixed prefix plus the session timestamp.
MODEL_DISPLAY_NAME = "kmnist-" + TIMESTAMP

# Launch the training job; the value returned by job.run() is kept in `model`.
model = job.run(
    # Command-line arguments forwarded to the training script.
    # NOTE(review): these flag names must be ones task.py actually parses --
    # verify against the script; an unrecognized flag would presumably abort
    # the run shortly after start-up.
    args=["--epochs", "10", "--learning-rate", "0.001"],
    # Single CPU-only worker; replace the machine type if the lab requires a
    # different one.
    machine_type="n1-standard-4",
    accelerator_count=0,
    replica_count=1,
    model_display_name=MODEL_DISPLAY_NAME,
)
My training is not completing: it stops and fails after about 4.2 minutes. I have tried almost 5 times, but my lab still does not complete. Please help me.
My lab name is:
Building and deploying CNN models with Vertex AI pipelines: Challenge Lab