Files
2025-04-30 15:53:51 +08:00

91 lines
2.7 KiB
Go

/*
* Copyright 2024 the KubeSphere Authors.
* Please refer to the LICENSE file in the root directory of the project.
* https://github.com/kubesphere/kubesphere/blob/master/LICENSE
*/
package workloads
import (
"context"
"fmt"
"strings"
"time"
batchv1 "k8s.io/api/batch/v1"
k8serr "k8s.io/apimachinery/pkg/api/errors"
metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
"k8s.io/apimachinery/pkg/runtime/schema"
"k8s.io/apimachinery/pkg/types"
"k8s.io/klog/v2"
runtimeclient "sigs.k8s.io/controller-runtime/pkg/client"
)
// retryTimes is the maximum number of attempts JobReRun makes to create the
// replacement Job before giving up.
const retryTimes = 3
// JobRunner re-runs existing Jobs.
type JobRunner interface {
// JobReRun re-runs the Job called name in namespace. The jobRunner
// implementation in this file returns a Conflict error when resourceVersion
// differs from the Job's current resourceVersion.
JobReRun(namespace, name, resourceVersion string) error
}
// jobRunner implements JobRunner on top of a controller-runtime client.
type jobRunner struct {
// client is used to get, delete and create Job objects.
client runtimeclient.Client
}
// NewJobRunner returns a JobRunner that performs all of its Job operations
// through the given client.
func NewJobRunner(client runtimeclient.Client) JobRunner {
	runner := new(jobRunner)
	runner.client = client
	return runner
}
// JobReRun re-runs the Job jobName in namespace by deleting it and creating a
// fresh copy of it.
//
// resourceVersion must equal the Job's current resourceVersion; otherwise a
// Conflict error is returned and the Job is left untouched. An error from the
// initial Get is returned as-is. A failure while deleting or re-creating the
// Job is logged together with its cause and reported to the caller as a
// generic "failed to rerun job" error.
func (r *jobRunner) JobReRun(namespace, jobName, resourceVersion string) error {
	ctx := context.Background()

	job := &batchv1.Job{}
	if err := r.client.Get(ctx, types.NamespacedName{Namespace: namespace, Name: jobName}, job); err != nil {
		return err
	}

	// Do not rerun the job if the caller's resourceVersion does not match.
	if job.GetObjectMeta().GetResourceVersion() != resourceVersion {
		err := k8serr.NewConflict(schema.GroupResource{
			Group: job.GetObjectKind().GroupVersionKind().Group, Resource: "job",
		}, jobName, fmt.Errorf("please apply your changes to the latest version and try again"))
		klog.Warning(err)
		return err
	}

	// Deep-copy so the label/annotation edits below never alias the maps of
	// the object that was fetched.
	newJob := job.DeepCopy()

	// Clear the fields that identify the old object and its progress so the
	// copy can be submitted as a new object.
	newJob.ResourceVersion = ""
	newJob.UID = ""
	newJob.Status = batchv1.JobStatus{}

	// A Job without annotations carries a nil map; writing to it would panic.
	if newJob.Annotations == nil {
		newJob.Annotations = map[string]string{}
	}
	newJob.Annotations["revisions"] = strings.ReplaceAll(job.Annotations["revisions"], "running", "unfinished")

	// Remove the controller-uid and job-name labels carried over from the old
	// Job. Selector is a pointer and may be nil; delete on a nil map is a no-op.
	if selector := newJob.Spec.Selector; selector != nil {
		delete(selector.MatchLabels, "controller-uid")
		delete(selector.MatchLabels, "batch.kubernetes.io/controller-uid")
	}
	podLabels := newJob.Spec.Template.ObjectMeta.Labels
	delete(podLabels, "controller-uid")
	delete(podLabels, "batch.kubernetes.io/controller-uid")
	delete(podLabels, "job-name")
	delete(podLabels, "batch.kubernetes.io/job-name")

	if err := r.deleteJob(namespace, jobName); err != nil {
		klog.Errorf("failed to rerun job %s, reason: %s", jobName, err)
		return fmt.Errorf("failed to rerun job %s", jobName)
	}

	// Creation is attempted up to retryTimes, pausing one second between
	// attempts (presumably to give the old Job time to disappear). There is
	// no pause after the final attempt.
	var err error
	for attempt := 0; attempt < retryTimes; attempt++ {
		if attempt > 0 {
			time.Sleep(time.Second)
		}
		if err = r.client.Create(ctx, newJob); err == nil {
			break
		}
	}
	if err != nil {
		klog.Errorf("failed to rerun job %s, reason: %s", jobName, err)
		return fmt.Errorf("failed to rerun job %s", jobName)
	}
	return nil
}
// deleteJob deletes the Job called job in namespace and returns the client's
// error, if any.
//
// Background propagation is requested explicitly so that the Pods owned by the
// Job are garbage-collected as well. NOTE(review): the API server is understood
// to orphan dependents of batch/v1 Jobs when no policy is given, which would
// leave the previous run's Pods behind — confirm against the cluster version.
func (r *jobRunner) deleteJob(namespace, job string) error {
	target := &batchv1.Job{ObjectMeta: metav1.ObjectMeta{Namespace: namespace, Name: job}}
	return r.client.Delete(context.Background(), target,
		runtimeclient.PropagationPolicy(metav1.DeletePropagationBackground))
}