Skip to content

Commit

Permalink
Merge branch 'master' into bug/fix_gpu_resource_issue
Browse files Browse the repository at this point in the history
  • Loading branch information
k82cn authored May 15, 2019
2 parents 9463a9c + fd4e5a0 commit 20bc119
Show file tree
Hide file tree
Showing 17 changed files with 452 additions and 70 deletions.
3 changes: 3 additions & 0 deletions cmd/controllers/app/server.go
Original file line number Diff line number Diff line change
Expand Up @@ -40,6 +40,7 @@ import (

"volcano.sh/volcano/cmd/controllers/app/options"
vkclient "volcano.sh/volcano/pkg/client/clientset/versioned"
"volcano.sh/volcano/pkg/controllers/garbagecollector"
"volcano.sh/volcano/pkg/controllers/job"
"volcano.sh/volcano/pkg/controllers/queue"
)
Expand Down Expand Up @@ -83,10 +84,12 @@ func Run(opt *options.ServerOption) error {

jobController := job.NewJobController(kubeClient, kbClient, vkClient)
queueController := queue.NewQueueController(kubeClient, kbClient)
garbageCollector := garbagecollector.New(vkClient)

run := func(ctx context.Context) {
go jobController.Run(ctx.Done())
go queueController.Run(ctx.Done())
go garbageCollector.Run(ctx.Done())
<-ctx.Done()
}

Expand Down
5 changes: 5 additions & 0 deletions pkg/admission/admit_job.go
Original file line number Diff line number Diff line change
Expand Up @@ -86,6 +86,11 @@ func validateJob(job v1alpha1.Job, reviewResponse *v1beta1.AdmissionResponse) st
return fmt.Sprintf("'maxRetry' cannot be less than zero.")
}

if job.Spec.TTLSecondsAfterFinished != nil && *job.Spec.TTLSecondsAfterFinished < 0 {
reviewResponse.Allowed = false
return fmt.Sprintf("'ttlSecondsAfterFinished' cannot be less than zero.")
}

if len(job.Spec.Tasks) == 0 {
reviewResponse.Allowed = false
return fmt.Sprintf("No task specified in job spec")
Expand Down
13 changes: 13 additions & 0 deletions pkg/apis/batch/v1alpha1/job.go
Original file line number Diff line number Diff line change
Expand Up @@ -70,6 +70,15 @@ type JobSpec struct {
// Defaults to 3.
// +optional
MaxRetry int32 `json:"maxRetry,omitempty" protobuf:"bytes,8,opt,name=maxRetry"`

// ttlSecondsAfterFinished limits the lifetime of a Job that has finished
// execution (either Completed or Failed). If this field is set,
// ttlSecondsAfterFinished after the Job finishes, it is eligible to be
// automatically deleted. If this field is unset,
// the Job won't be automatically deleted. If this field is set to zero,
// the Job becomes eligible to be deleted immediately after it finishes.
// +optional
TTLSecondsAfterFinished *int32 `json:"ttlSecondsAfterFinished,omitempty" protobuf:"varint,9,opt,name=ttlSecondsAfterFinished"`
}

// VolumeSpec defines the specification of Volume, e.g. PVC
Expand Down Expand Up @@ -225,6 +234,10 @@ type JobState struct {
// Human-readable message indicating details about last transition.
// +optional
Message string `json:"message,omitempty" protobuf:"bytes,3,opt,name=message"`

// Last time the condition transitioned from one phase to another.
// +optional
LastTransitionTime metav1.Time `json:"lastTransitionTime,omitempty" protobuf:"bytes,4,opt,name=lastTransitionTime"`
}

// JobStatus represents the current status of a Job
Expand Down
8 changes: 7 additions & 1 deletion pkg/apis/batch/v1alpha1/zz_generated.deepcopy.go

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

283 changes: 283 additions & 0 deletions pkg/controllers/garbagecollector/garbagecollector.go
Original file line number Diff line number Diff line change
@@ -0,0 +1,283 @@
/*
Copyright 2019 The Volcano Authors.
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/

package garbagecollector

import (
"fmt"
"time"

"github.com/golang/glog"

"k8s.io/apimachinery/pkg/api/errors"
metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
"k8s.io/apimachinery/pkg/util/wait"
"k8s.io/client-go/tools/cache"
"k8s.io/client-go/util/workqueue"
"k8s.io/kubernetes/pkg/controller"

"volcano.sh/volcano/pkg/apis/batch/v1alpha1"
vkver "volcano.sh/volcano/pkg/client/clientset/versioned"
vkinfoext "volcano.sh/volcano/pkg/client/informers/externalversions"
vkbatchinfo "volcano.sh/volcano/pkg/client/informers/externalversions/batch/v1alpha1"
vkbatchlister "volcano.sh/volcano/pkg/client/listers/batch/v1alpha1"
)

// GarbageCollector removes finished Jobs once their
// `.spec.ttlSecondsAfterFinished` has elapsed. Currently Jobs are the only
// resource it watches.
//
// Job add and update events enqueue the key of every Job that is finished,
// has a non-nil TTL and is not already being deleted. Workers drain `queue`
// and check each Job's TTL: a Job whose TTL has not expired yet is re-added
// to the queue for the moment the TTL is expected to run out, and a Job whose
// TTL has expired is deleted through the API server.
//
// This lives outside of the Job controller for separation of concerns, and
// because it is meant to be extended to other finishable resource types.
type GarbageCollector struct {
	// vkClient talks to the API server for the final freshness check and
	// for the delete request.
	vkClient vkver.Interface

	// queue holds the namespace/name keys of Jobs waiting for a TTL check.
	queue workqueue.RateLimitingInterface

	// jobInformer delivers the Job add/update events that feed the queue.
	jobInformer vkbatchinfo.JobInformer

	// jobLister reads Jobs from the informer's local store.
	jobLister vkbatchlister.JobLister
	// jobSynced reports whether the informer's store has completed its
	// initial sync.
	jobSynced func() bool
}

// New builds a GarbageCollector on top of vkClient. It creates a Job informer
// (shared informer factory, resync period 0), wires the collector's lister,
// sync check and rate-limited work queue, and registers the add/update event
// handlers. Nothing is started until Run is called.
func New(vkClient vkver.Interface) *GarbageCollector {
	jobs := vkinfoext.NewSharedInformerFactory(vkClient, 0).Batch().V1alpha1().Jobs()

	collector := &GarbageCollector{
		vkClient:    vkClient,
		jobInformer: jobs,
		jobLister:   jobs.Lister(),
		jobSynced:   jobs.Informer().HasSynced,
		queue:       workqueue.NewRateLimitingQueue(workqueue.DefaultControllerRateLimiter()),
	}

	// Delete events are deliberately not handled: a deleted Job needs no cleanup.
	handlers := cache.ResourceEventHandlerFuncs{
		AddFunc:    collector.addJob,
		UpdateFunc: collector.updateJob,
	}
	jobs.Informer().AddEventHandler(handlers)

	return collector
}

// Run starts the Job informer, waits for its cache to sync and then runs the
// cleanup worker until stopCh is closed. If the cache never syncs, Run returns
// without starting the worker. The work queue is shut down on return.
func (gb *GarbageCollector) Run(stopCh <-chan struct{}) {
	defer gb.queue.ShutDown()

	glog.Infof("Starting garbage collector")
	defer glog.Infof("Shutting down garbage collector")

	informer := gb.jobInformer.Informer()
	go informer.Run(stopCh)

	if synced := controller.WaitForCacheSync("garbage collector", stopCh, gb.jobSynced); synced {
		// wait.Until re-invokes the worker one second after it returns,
		// until stopCh is closed.
		go wait.Until(gb.worker, time.Second, stopCh)

		<-stopCh
	}
}

// addJob is the informer's add handler. It enqueues the new Job when it is
// not being deleted and needsCleanup reports that it is eligible.
// obj must be a *v1alpha1.Job; any other type panics on the assertion.
func (gb *GarbageCollector) addJob(obj interface{}) {
	added := obj.(*v1alpha1.Job)
	glog.V(4).Infof("Adding job %s/%s", added.Namespace, added.Name)

	// A Job with a deletion timestamp is already on its way out.
	if added.DeletionTimestamp != nil {
		return
	}
	if !needsCleanup(added) {
		return
	}
	gb.enqueue(added)
}

// updateJob is the informer's update handler. Only the current version of the
// Job is inspected (old is ignored); it is enqueued when it is not being
// deleted and needsCleanup reports that it is eligible.
// cur must be a *v1alpha1.Job; any other type panics on the assertion.
func (gb *GarbageCollector) updateJob(old, cur interface{}) {
	current := cur.(*v1alpha1.Job)
	glog.V(4).Infof("Updating job %s/%s", current.Namespace, current.Name)

	beingDeleted := current.DeletionTimestamp != nil
	if beingDeleted || !needsCleanup(current) {
		return
	}
	gb.enqueue(current)
}

// enqueue adds the Job's key to the work queue for immediate processing.
// If no key can be derived for the Job, the failure is logged and the Job is
// not queued.
func (gb *GarbageCollector) enqueue(job *v1alpha1.Job) {
	glog.V(4).Infof("Add job %s/%s to cleanup", job.Namespace, job.Name)

	key, keyErr := controller.KeyFunc(job)
	if keyErr == nil {
		gb.queue.Add(key)
		return
	}

	glog.Errorf("couldn't get key for object %#v: %v", job, keyErr)
}

// enqueueAfter schedules the Job's key to be added to the work queue once the
// given delay has passed. If no key can be derived for the Job, the failure is
// logged and nothing is scheduled.
func (gb *GarbageCollector) enqueueAfter(job *v1alpha1.Job, after time.Duration) {
	if key, keyErr := controller.KeyFunc(job); keyErr != nil {
		glog.Errorf("couldn't get key for object %#v: %v", job, keyErr)
	} else {
		gb.queue.AddAfter(key, after)
	}
}

// worker processes queue items one after another and returns once
// processNextWorkItem reports that there is nothing more to do.
func (gb *GarbageCollector) worker() {
	for {
		if more := gb.processNextWorkItem(); !more {
			return
		}
	}
}

// processNextWorkItem takes one key off the queue, runs processJob on it and
// hands the outcome to handleErr. It returns false only when the queue's Get
// signals that the worker should quit, and true otherwise.
func (gb *GarbageCollector) processNextWorkItem() bool {
	item, shutdown := gb.queue.Get()
	if shutdown {
		return false
	}
	// Every item obtained from Get must be marked Done, whatever the outcome.
	defer gb.queue.Done(item)

	result := gb.processJob(item.(string))
	gb.handleErr(result, item)

	return true
}

// handleErr settles a processed key: on failure the error is logged and the
// key is re-added to the queue with rate limiting; on success Forget is called
// on the key.
func (gb *GarbageCollector) handleErr(err error, key interface{}) {
	if err != nil {
		glog.Errorf("error cleaning up Job %v, will retry: %v", key, err)
		gb.queue.AddRateLimited(key)
		return
	}

	gb.queue.Forget(key)
}

// processJob looks up the Job identified by key and deletes it if it has
// finished and its TTL after finishing has run out. A Job that is finished but
// whose TTL has not expired yet is re-queued (by processTTL) for the time the
// TTL is expected to expire. Jobs that no longer exist, are being deleted, or
// do not need cleanup are ignored.
//
// It returns an error when the key is malformed, a lookup fails for a reason
// other than "not found", the TTL cannot be evaluated, or the delete fails.
//
// This function is not meant to be invoked concurrently with the same key.
func (gb *GarbageCollector) processJob(key string) error {
	namespace, name, err := cache.SplitMetaNamespaceKey(key)
	if err != nil {
		return err
	}

	glog.V(4).Infof("Checking if Job %s/%s is ready for cleanup", namespace, name)

	// First pass: consult the informer cache. A Job missing from the cache
	// has already been deleted, so there is nothing left to do.
	cached, err := gb.jobLister.Jobs(namespace).Get(name)
	switch {
	case errors.IsNotFound(err):
		return nil
	case err != nil:
		return err
	}

	expired, err := gb.processTTL(cached)
	if err != nil {
		return err
	}
	if !expired {
		return nil
	}

	// Second pass: the cached copy may be stale (for example the TTL may have
	// been changed), so re-read the Job from the API server and evaluate the
	// TTL again before deleting. The fresh Job may even carry a different UID;
	// that is fine because all checks are repeated against it.
	fresh, err := gb.vkClient.BatchV1alpha1().Jobs(namespace).Get(name, metav1.GetOptions{})
	switch {
	case errors.IsNotFound(err):
		return nil
	case err != nil:
		return err
	}

	expired, err = gb.processTTL(fresh)
	if err != nil {
		return err
	}
	if !expired {
		return nil
	}

	// The TTL has truly expired: cascade-delete the Job in the foreground.
	// The UID precondition pins the delete to the exact object just checked.
	propagation := metav1.DeletePropagationForeground
	glog.V(4).Infof("Cleaning up Job %s/%s", namespace, name)
	return gb.vkClient.BatchV1alpha1().Jobs(fresh.Namespace).Delete(fresh.Name, &metav1.DeleteOptions{
		PropagationPolicy: &propagation,
		Preconditions:     &metav1.Preconditions{UID: &fresh.UID},
	})
}

// processTTL reports whether the given Job's TTL has expired. When the TTL is
// still running, the Job is re-queued to be checked again once the remaining
// time has passed. Jobs that are being deleted or do not need cleanup yield
// (false, nil). An error is returned when the remaining time cannot be
// computed.
func (gb *GarbageCollector) processTTL(job *v1alpha1.Job) (expired bool, err error) {
	// Jobs already being deleted need no further action.
	if job.DeletionTimestamp != nil {
		return false, nil
	}
	// Neither do Jobs that are unfinished or have no TTL.
	if !needsCleanup(job) {
		return false, nil
	}

	now := time.Now()
	remaining, err := timeLeft(job, &now)
	if err != nil {
		return false, err
	}

	if *remaining > 0 {
		// Not expired yet: come back when the TTL is due.
		gb.enqueueAfter(job, *remaining)
		return false, nil
	}

	return true, nil
}

// needsCleanup reports whether the Job has a TTL configured and has finished.
func needsCleanup(j *v1alpha1.Job) bool {
	if j.Spec.TTLSecondsAfterFinished == nil {
		return false
	}
	return isJobFinished(j)
}

// isJobFinished reports whether the Job's current phase is Completed, Failed
// or Terminated.
func isJobFinished(job *v1alpha1.Job) bool {
	switch job.Status.State.Phase {
	case v1alpha1.Completed, v1alpha1.Failed, v1alpha1.Terminated:
		return true
	default:
		return false
	}
}

// getFinishAndExpireTime returns, both in UTC, the time the Job finished and
// the time its TTL expires (finish time plus ttlSecondsAfterFinished).
// It returns an error if the Job does not need cleanup or its finish time
// cannot be determined.
func getFinishAndExpireTime(j *v1alpha1.Job) (*time.Time, *time.Time, error) {
	if !needsCleanup(j) {
		return nil, nil, fmt.Errorf("Job %s/%s should not be cleaned up", j.Namespace, j.Name)
	}

	finished, err := jobFinishTime(j)
	if err != nil {
		return nil, nil, err
	}

	// needsCleanup guarantees the TTL pointer is non-nil here.
	ttl := time.Duration(*j.Spec.TTLSecondsAfterFinished) * time.Second

	finishUTC := finished.UTC()
	expireUTC := finishUTC.Add(ttl)
	return &finishUTC, &expireUTC, nil
}

// timeLeft returns how much of the Job's TTL remains as of since; the result
// is zero or negative once the TTL has expired. A warning is logged when the
// Job's finish time lies after since. An error is returned when the finish and
// expiry times cannot be determined.
func timeLeft(j *v1alpha1.Job, since *time.Time) (*time.Duration, error) {
	finishAt, expireAt, err := getFinishAndExpireTime(j)
	if err != nil {
		return nil, err
	}

	reference := since.UTC()
	finished := finishAt.UTC()
	expires := expireAt.UTC()

	if finished.After(reference) {
		glog.Warningf("Warning: Found Job %s/%s finished in the future. This is likely due to time skew in the cluster. Job cleanup will be deferred.", j.Namespace, j.Name)
	}

	remaining := expires.Sub(reference)
	glog.V(4).Infof("Found Job %s/%s finished at %v, remaining TTL %v since %v, TTL will expire at %v", j.Namespace, j.Name, finished, remaining, reference, expires)
	return &remaining, nil
}

// jobFinishTime returns the time an already finished Job finished, taken from
// the last transition time of its state. It returns an error when that
// timestamp is unset.
func jobFinishTime(finishedJob *v1alpha1.Job) (metav1.Time, error) {
	transitioned := finishedJob.Status.State.LastTransitionTime
	if !transitioned.IsZero() {
		return transitioned, nil
	}
	return metav1.Time{}, fmt.Errorf("unable to find the time when the Job %s/%s finished", finishedJob.Namespace, finishedJob.Name)
}
Loading

0 comments on commit 20bc119

Please sign in to comment.