Skip to content

Commit

Permalink
Fix incorrect TensorBoard images. (#1109)
Browse files Browse the repository at this point in the history
Signed-off-by: Syulin7 <[email protected]>
  • Loading branch information
Syulin7 authored Jul 22, 2024
1 parent c9dbc8f commit 9064896
Show file tree
Hide file tree
Showing 8 changed files with 11 additions and 12 deletions.
2 changes: 1 addition & 1 deletion charts/cron-tfjob/values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -48,7 +48,7 @@ tfjob:
imagePullPolicy: Always

useTensorboard: false
tensorboardImage: registry.cn-zhangjiakou.aliyuncs.com/kube-ai/tensorflow:1.5.0-devel
tensorboardImage: registry.cn-zhangjiakou.aliyuncs.com/acs/tensorflow:1.12.0-devel
tensorboardImagePullpolicy: Always
tensorboardServiceType: NodePort
tensorboardResources: {}
Expand Down
2 changes: 1 addition & 1 deletion charts/etjob/values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -16,7 +16,7 @@ shmSize: 2Gi
privileged: false

useTensorboard: false
tensorboardImage: registry.cn-zhangjiakou.aliyuncs.com/tensorflow-samples/tensorflow:1.5.0-devel
tensorboardImage: registry.cn-zhangjiakou.aliyuncs.com/acs/tensorflow:1.12.0-devel
tensorboardImagePullpolicy: Always
tensorboardServiceType: NodePort

Expand Down
2 changes: 1 addition & 1 deletion charts/mpijob/values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -16,7 +16,7 @@ shmSize: 2Gi
privileged: false

useTensorboard: false
tensorboardImage: registry.cn-zhangjiakou.aliyuncs.com/acs/tensorflow:1.5.0-devel
tensorboardImage: registry.cn-zhangjiakou.aliyuncs.com/acs/tensorflow:1.12.0-devel
tensorboardImagePullpolicy: Always
tensorboardServiceType: NodePort

Expand Down
2 changes: 1 addition & 1 deletion charts/pytorchjob/values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -15,7 +15,7 @@ gitImage: registry.cn-zhangjiakou.aliyuncs.com/acs/git-sync:v3.3.5
privileged: false

useTensorboard: false
tensorboardImage: registry.cn-zhangjiakou.aliyuncs.com/kube-ai/tensorflow:1.5.0-devel
tensorboardImage: registry.cn-zhangjiakou.aliyuncs.com/acs/tensorflow:1.12.0-devel
tensorboardImagePullpolicy: Always
tensorboardServiceType: NodePort

Expand Down
2 changes: 1 addition & 1 deletion charts/tfjob/values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -40,7 +40,7 @@ gitImage: registry.cn-zhangjiakou.aliyuncs.com/acs/git-sync:v3.3.5
imagePullPolicy: Always

useTensorboard: false
tensorboardImage: registry.cn-zhangjiakou.aliyuncs.com/kube-ai/tensorflow:1.5.0-devel
tensorboardImage: registry.cn-zhangjiakou.aliyuncs.com/acs/tensorflow:1.12.0-devel
tensorboardImagePullpolicy: Always
tensorboardServiceType: NodePort
tensorboardResources: {}
Expand Down
3 changes: 1 addition & 2 deletions pkg/apis/training/common.go
Original file line number Diff line number Diff line change
Expand Up @@ -25,6 +25,5 @@ var DefaultCommonSubmitArgs = types.CommonSubmitArgs{
}

var DefaultSubmitTensorboardArgs = types.SubmitTensorboardArgs{
TensorboardImage: "registry.cn-zhangjiakou.aliyuncs.com/acs/tensorflow:1.12.0-devel",
TrainingLogdir: "/training_logs",
TrainingLogdir: "/training_logs",
}
6 changes: 3 additions & 3 deletions pkg/apis/types/submit_tfjob.go
Original file line number Diff line number Diff line change
Expand Up @@ -107,9 +107,9 @@ type SubmitTFJobArgs struct {

// SubmitTensorboardArgs is used to store tensorboard information
type SubmitTensorboardArgs struct {
UseTensorboard bool `yaml:"useTensorboard"` // --tensorboard
TensorboardImage string `yaml:"tensorboardImage"` // --tensorboardImage
TrainingLogdir string `yaml:"trainingLogdir"` // --logdir
UseTensorboard bool `yaml:"useTensorboard"` // --tensorboard
TensorboardImage string `yaml:"tensorboardImage,omitempty"` // --tensorboardImage
TrainingLogdir string `yaml:"trainingLogdir"` // --logdir
HostLogPath string `yaml:"hostLogPath"`
IsLocalLogging bool `yaml:"isLocalLogging"`
}
Expand Down
4 changes: 2 additions & 2 deletions pkg/argsbuilder/submit_tensorboard.go
Original file line number Diff line number Diff line change
Expand Up @@ -85,9 +85,9 @@ func (s *SubmitTensorboardArgsBuilder) AddCommandFlags(command *cobra.Command) {
s.subBuilders[name].AddCommandFlags(command)
}
command.Flags().BoolVar(&s.args.UseTensorboard, "tensorboard", false, "enable tensorboard")
command.Flags().StringVar(&s.args.TensorboardImage, "tensorboardImage", "registry.cn-zhangjiakou.aliyuncs.com/acs/tensorflow:1.12.0-devel", "the docker image for tensorboard")
command.Flags().StringVar(&s.args.TensorboardImage, "tensorboardImage", "", "the docker image for tensorboard")
_ = command.Flags().MarkDeprecated("tensorboardImage", "please use --tensorboard-image instead")
command.Flags().StringVar(&s.args.TensorboardImage, "tensorboard-image", "registry.cn-zhangjiakou.aliyuncs.com/acs/tensorflow:1.12.0-devel", "the docker image for tensorboard")
command.Flags().StringVar(&s.args.TensorboardImage, "tensorboard-image", "", "the docker image for tensorboard")
command.Flags().StringVar(&s.args.TrainingLogdir, "logdir", "/training_logs", "the training logs dir, default is /training_logs")
}

Expand Down

0 comments on commit 9064896

Please sign in to comment.