Skip to content

Commit

Permalink
delete cm if job failed
Browse files Browse the repository at this point in the history
Signed-off-by: zibai <[email protected]>
  • Loading branch information
gujingit committed Mar 7, 2024
1 parent 70f4a13 commit ddea92f
Show file tree
Hide file tree
Showing 2 changed files with 13 additions and 6 deletions.
4 changes: 2 additions & 2 deletions pkg/util/kubeclient/configmap.go
Original file line number Diff line number Diff line change
Expand Up @@ -77,7 +77,7 @@ func CheckJobIsOwnedByUser(namespace, jobName string, jobType types.TrainingJobT
return true, nil
}

func CreateAppConfigmap(name, trainingType, namespace, configFileName, appInfoFileName, chartName, chartVersion string) (err error) {
func CreateAppConfigmap(name, namespace, configFileName, appInfoFileName, chartName, chartVersion string) (err error) {
data := map[string]string{
chartName: chartVersion,
}
Expand All @@ -97,7 +97,7 @@ func CreateAppConfigmap(name, trainingType, namespace, configFileName, appInfoFi
return err
}
configmap := obj.(*corev1.ConfigMap)
configmap.Name = fmt.Sprintf("%v-%v", name, trainingType)
configmap.Name = name
configmap.Namespace = namespace
configmap.Data = data
arenaConfiger := config.GetArenaConfiger()
Expand Down
15 changes: 11 additions & 4 deletions pkg/workflow/workflow.go
Original file line number Diff line number Diff line change
Expand Up @@ -141,8 +141,9 @@ func SubmitJob(name string, trainingType string, namespace string, values interf
if err != nil {
return err
}
err = kubeclient.CreateAppConfigmap(name,
trainingType,

configName := fmt.Sprintf("%v-%v", name, trainingType)
err = kubeclient.CreateAppConfigmap(configName,
namespace,
valueFileName,
appInfoFileName,
Expand All @@ -161,8 +162,14 @@ func SubmitJob(name string, trainingType string, namespace string, values interf
fmt.Printf("%s", result)
if err != nil {
// clean configmap
log.Infof("clean up the config map %s because creating application failed.", name)
log.Warnf("Please clean up the training job by using `arena delete %s --type %s`", name, trainingType)
delErr := kubeclient.DeleteConfigMap(namespace, configName)
if delErr != nil {
log.Errorf("Failed to clean up configmap %s in namespace %s, error: %s", configName, namespace, delErr.Error())
} else {
log.Infof("Successfully clean up the config map %s in namespace %s because creating application failed.", configName, namespace)
}

log.Warnf("Please clean up the %s job", name)
return err
}

Expand Down

0 comments on commit ddea92f

Please sign in to comment.