2018-01-09 18:57:14 +00:00
/*
Copyright 2015 The Kubernetes Authors.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/
package cmd
import (
	"errors"
	"fmt"
	"math"
	"sort"
	"strings"
	"time"

	"github.com/jonboulle/clockwork"
	"github.com/spf13/cobra"

	corev1 "k8s.io/api/core/v1"
	policyv1beta1 "k8s.io/api/policy/v1beta1"
	apierrors "k8s.io/apimachinery/pkg/api/errors"
	metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
	"k8s.io/apimachinery/pkg/fields"
	"k8s.io/apimachinery/pkg/labels"
	"k8s.io/apimachinery/pkg/runtime"
	"k8s.io/apimachinery/pkg/runtime/schema"
	"k8s.io/apimachinery/pkg/types"
	"k8s.io/apimachinery/pkg/util/json"
	"k8s.io/apimachinery/pkg/util/sets"
	"k8s.io/apimachinery/pkg/util/strategicpatch"
	"k8s.io/apimachinery/pkg/util/wait"
	"k8s.io/client-go/kubernetes"
	restclient "k8s.io/client-go/rest"
	"k8s.io/kubernetes/pkg/api/legacyscheme"
	"k8s.io/kubernetes/pkg/kubectl/cmd/templates"
	cmdutil "k8s.io/kubernetes/pkg/kubectl/cmd/util"
	"k8s.io/kubernetes/pkg/kubectl/genericclioptions"
	"k8s.io/kubernetes/pkg/kubectl/genericclioptions/printers"
	"k8s.io/kubernetes/pkg/kubectl/genericclioptions/resource"
	"k8s.io/kubernetes/pkg/kubectl/scheme"
	"k8s.io/kubernetes/pkg/kubectl/util/i18n"
)
type DrainOptions struct {
2018-07-18 14:47:22 +00:00
PrintFlags * genericclioptions . PrintFlags
ToPrinter func ( string ) ( printers . ResourcePrinterFunc , error )
Namespace string
2018-01-09 18:57:14 +00:00
client kubernetes . Interface
restClient * restclient . RESTClient
Force bool
DryRun bool
GracePeriodSeconds int
IgnoreDaemonsets bool
Timeout time . Duration
backOff clockwork . Clock
DeleteLocalData bool
Selector string
2018-03-06 22:33:18 +00:00
PodSelector string
2018-01-09 18:57:14 +00:00
nodeInfos [ ] * resource . Info
typer runtime . ObjectTyper
2018-07-18 14:47:22 +00:00
genericclioptions . IOStreams
2018-01-09 18:57:14 +00:00
}
// podFilter takes a pod and returns a bool indicating whether or not to operate on the
// pod, an optional warning message, and an optional fatal error.
// A nil warning or fatal means the filter has nothing to report for that pod.
type podFilter func ( corev1 . Pod ) ( include bool , w * warning , f * fatal )
// warning wraps the message a pod filter reports when a pod is noteworthy but
// does not block the operation. The embedded string is the message text.
type warning struct {
string
}
// fatal wraps the message a pod filter reports when a pod prevents the
// operation from proceeding. The embedded string is the message text.
type fatal struct {
string
}
// Constants used when probing for eviction support and when reporting why a
// pod was skipped, deleted with a warning, or blocked the drain.
const (
// EvictionKind is the Kind set on Eviction objects and matched during discovery.
EvictionKind = "Eviction"
// EvictionSubresource is the API resource name matched during discovery.
EvictionSubresource = "pods/eviction"
// Messages for DaemonSet-managed pods (fatal without --ignore-daemonsets).
kDaemonsetFatal = "DaemonSet-managed pods (use --ignore-daemonsets to ignore)"
kDaemonsetWarning = "Ignoring DaemonSet-managed pods"
// Messages for pods with emptyDir volumes (fatal without --delete-local-data).
kLocalStorageFatal = "pods with local storage (use --delete-local-data to override)"
kLocalStorageWarning = "Deleting pods with local storage"
// Messages for pods without a controller (fatal without --force).
kUnmanagedFatal = "pods not managed by ReplicationController, ReplicaSet, Job, DaemonSet or StatefulSet (use --force to override)"
kUnmanagedWarning = "Deleting pods not managed by ReplicationController, ReplicaSet, Job, DaemonSet or StatefulSet"
)
var (
	// cordon_long is the long help text of the cordon command.
	cordon_long = templates.LongDesc(i18n.T(`
		Mark node as unschedulable.`))

	// cordon_example is the usage example shown in the cordon command's help.
	cordon_example = templates.Examples(i18n.T(`
		# Mark node "foo" as unschedulable.
		kubectl cordon foo`))
)
2018-07-18 14:47:22 +00:00
func NewCmdCordon ( f cmdutil . Factory , ioStreams genericclioptions . IOStreams ) * cobra . Command {
options := & DrainOptions {
PrintFlags : genericclioptions . NewPrintFlags ( "cordoned" ) . WithTypeSetter ( scheme . Scheme ) ,
IOStreams : ioStreams ,
}
2018-01-09 18:57:14 +00:00
cmd := & cobra . Command {
2018-03-06 22:33:18 +00:00
Use : "cordon NODE" ,
DisableFlagsInUseLine : true ,
2018-01-09 18:57:14 +00:00
Short : i18n . T ( "Mark node as unschedulable" ) ,
Long : cordon_long ,
Example : cordon_example ,
Run : func ( cmd * cobra . Command , args [ ] string ) {
2018-07-18 14:47:22 +00:00
cmdutil . CheckErr ( options . Complete ( f , cmd , args ) )
2018-01-09 18:57:14 +00:00
cmdutil . CheckErr ( options . RunCordonOrUncordon ( true ) )
} ,
}
cmd . Flags ( ) . StringVarP ( & options . Selector , "selector" , "l" , options . Selector , "Selector (label query) to filter on" )
cmdutil . AddDryRunFlag ( cmd )
return cmd
}
var (
	// uncordon_long is the long help text of the uncordon command.
	uncordon_long = templates.LongDesc(i18n.T(`
		Mark node as schedulable.`))

	// uncordon_example is the usage example shown in the uncordon command's help.
	uncordon_example = templates.Examples(i18n.T(`
		# Mark node "foo" as schedulable.
		$ kubectl uncordon foo`))
)
2018-07-18 14:47:22 +00:00
func NewCmdUncordon ( f cmdutil . Factory , ioStreams genericclioptions . IOStreams ) * cobra . Command {
options := & DrainOptions {
PrintFlags : genericclioptions . NewPrintFlags ( "uncordoned" ) . WithTypeSetter ( scheme . Scheme ) ,
IOStreams : ioStreams ,
}
2018-01-09 18:57:14 +00:00
cmd := & cobra . Command {
2018-03-06 22:33:18 +00:00
Use : "uncordon NODE" ,
DisableFlagsInUseLine : true ,
2018-01-09 18:57:14 +00:00
Short : i18n . T ( "Mark node as schedulable" ) ,
Long : uncordon_long ,
Example : uncordon_example ,
Run : func ( cmd * cobra . Command , args [ ] string ) {
2018-07-18 14:47:22 +00:00
cmdutil . CheckErr ( options . Complete ( f , cmd , args ) )
2018-01-09 18:57:14 +00:00
cmdutil . CheckErr ( options . RunCordonOrUncordon ( false ) )
} ,
}
cmd . Flags ( ) . StringVarP ( & options . Selector , "selector" , "l" , options . Selector , "Selector (label query) to filter on" )
cmdutil . AddDryRunFlag ( cmd )
return cmd
}
var (
	// drain_long is the long help text of the drain command. Flag names and
	// URLs are written without embedded spaces so they can be copied verbatim.
	drain_long = templates.LongDesc(i18n.T(`
		Drain node in preparation for maintenance.
		The given node will be marked unschedulable to prevent new pods from arriving.
		'drain' evicts the pods if the APIServer supports eviction
		(http://kubernetes.io/docs/admin/disruptions/). Otherwise, it will use normal DELETE
		to delete the pods.
		The 'drain' evicts or deletes all pods except mirror pods (which cannot be deleted through
		the API server). If there are DaemonSet-managed pods, drain will not proceed
		without --ignore-daemonsets, and regardless it will not delete any
		DaemonSet-managed pods, because those pods would be immediately replaced by the
		DaemonSet controller, which ignores unschedulable markings. If there are any
		pods that are neither mirror pods nor managed by ReplicationController,
		ReplicaSet, DaemonSet, StatefulSet or Job, then drain will not delete any pods unless you
		use --force. --force will also allow deletion to proceed if the managing resource of one
		or more pods is missing.
		'drain' waits for graceful termination. You should not operate on the machine until
		the command completes.
		When you are ready to put the node back into service, use kubectl uncordon, which
		will make the node schedulable again.
		![Workflow](http://kubernetes.io/images/docs/kubectl_drain.svg)`))

	// drain_example holds the usage examples shown in the drain command's help.
	drain_example = templates.Examples(i18n.T(`
		# Drain node "foo", even if there are pods not managed by a ReplicationController, ReplicaSet, Job, DaemonSet or StatefulSet on it.
		$ kubectl drain foo --force
		# As above, but abort if there are pods not managed by a ReplicationController, ReplicaSet, Job, DaemonSet or StatefulSet, and use a grace period of 15 minutes.
		$ kubectl drain foo --grace-period=900`))
)
2018-07-18 14:47:22 +00:00
// NewDrainOptions returns DrainOptions preset for the drain command: a
// "drained" print operation, a real clock, and a grace period of -1 (meaning
// each pod's own default applies). The factory argument is not used here.
func NewDrainOptions(f cmdutil.Factory, ioStreams genericclioptions.IOStreams) *DrainOptions {
	opts := new(DrainOptions)
	opts.PrintFlags = genericclioptions.NewPrintFlags("drained").WithTypeSetter(scheme.Scheme)
	opts.IOStreams = ioStreams
	opts.backOff = clockwork.NewRealClock()
	opts.GracePeriodSeconds = -1
	return opts
}
func NewCmdDrain ( f cmdutil . Factory , ioStreams genericclioptions . IOStreams ) * cobra . Command {
options := NewDrainOptions ( f , ioStreams )
2018-01-09 18:57:14 +00:00
cmd := & cobra . Command {
2018-03-06 22:33:18 +00:00
Use : "drain NODE" ,
DisableFlagsInUseLine : true ,
2018-01-09 18:57:14 +00:00
Short : i18n . T ( "Drain node in preparation for maintenance" ) ,
Long : drain_long ,
Example : drain_example ,
Run : func ( cmd * cobra . Command , args [ ] string ) {
2018-07-18 14:47:22 +00:00
cmdutil . CheckErr ( options . Complete ( f , cmd , args ) )
2018-01-09 18:57:14 +00:00
cmdutil . CheckErr ( options . RunDrain ( ) )
} ,
}
2018-07-18 14:47:22 +00:00
cmd . Flags ( ) . BoolVar ( & options . Force , "force" , options . Force , "Continue even if there are pods not managed by a ReplicationController, ReplicaSet, Job, DaemonSet or StatefulSet." )
cmd . Flags ( ) . BoolVar ( & options . IgnoreDaemonsets , "ignore-daemonsets" , options . IgnoreDaemonsets , "Ignore DaemonSet-managed pods." )
cmd . Flags ( ) . BoolVar ( & options . DeleteLocalData , "delete-local-data" , options . DeleteLocalData , "Continue even if there are pods using emptyDir (local data that will be deleted when the node is drained)." )
cmd . Flags ( ) . IntVar ( & options . GracePeriodSeconds , "grace-period" , options . GracePeriodSeconds , "Period of time in seconds given to each pod to terminate gracefully. If negative, the default value specified in the pod will be used." )
cmd . Flags ( ) . DurationVar ( & options . Timeout , "timeout" , options . Timeout , "The length of time to wait before giving up, zero means infinite" )
2018-01-09 18:57:14 +00:00
cmd . Flags ( ) . StringVarP ( & options . Selector , "selector" , "l" , options . Selector , "Selector (label query) to filter on" )
2018-03-06 22:33:18 +00:00
cmd . Flags ( ) . StringVarP ( & options . PodSelector , "pod-selector" , "" , options . PodSelector , "Label selector to filter pods on the node" )
2018-01-09 18:57:14 +00:00
cmdutil . AddDryRunFlag ( cmd )
return cmd
}
2018-07-18 14:47:22 +00:00
// Complete populates some fields from the factory, grabs command line
2018-01-09 18:57:14 +00:00
// arguments and looks up the node using Builder
2018-07-18 14:47:22 +00:00
func ( o * DrainOptions ) Complete ( f cmdutil . Factory , cmd * cobra . Command , args [ ] string ) error {
2018-01-09 18:57:14 +00:00
var err error
if len ( args ) == 0 && ! cmd . Flags ( ) . Changed ( "selector" ) {
return cmdutil . UsageErrorf ( cmd , fmt . Sprintf ( "USAGE: %s [flags]" , cmd . Use ) )
}
if len ( args ) > 0 && len ( o . Selector ) > 0 {
return cmdutil . UsageErrorf ( cmd , "error: cannot specify both a node name and a --selector option" )
}
if len ( args ) > 0 && len ( args ) != 1 {
return cmdutil . UsageErrorf ( cmd , fmt . Sprintf ( "USAGE: %s [flags]" , cmd . Use ) )
}
2018-03-06 22:33:18 +00:00
o . DryRun = cmdutil . GetDryRunFlag ( cmd )
2018-01-09 18:57:14 +00:00
2018-07-18 14:47:22 +00:00
if o . client , err = f . KubernetesClientSet ( ) ; err != nil {
2018-01-09 18:57:14 +00:00
return err
}
2018-03-06 22:33:18 +00:00
if len ( o . PodSelector ) > 0 {
if _ , err := labels . Parse ( o . PodSelector ) ; err != nil {
return errors . New ( "--pod-selector=<pod_selector> must be a valid label selector" )
}
}
2018-07-18 14:47:22 +00:00
o . restClient , err = f . RESTClient ( )
2018-01-09 18:57:14 +00:00
if err != nil {
return err
}
o . nodeInfos = [ ] * resource . Info { }
2018-07-18 14:47:22 +00:00
o . Namespace , _ , err = f . ToRawKubeConfigLoader ( ) . Namespace ( )
2018-01-09 18:57:14 +00:00
if err != nil {
return err
}
2018-07-18 14:47:22 +00:00
o . ToPrinter = func ( operation string ) ( printers . ResourcePrinterFunc , error ) {
o . PrintFlags . NamePrintFlags . Operation = operation
if o . DryRun {
o . PrintFlags . Complete ( "%s (dry run)" )
}
printer , err := o . PrintFlags . ToPrinter ( )
if err != nil {
return nil , err
}
return printer . PrintObj , nil
}
builder := f . NewBuilder ( ) .
WithScheme ( legacyscheme . Scheme ) .
NamespaceParam ( o . Namespace ) . DefaultNamespace ( ) .
2018-01-09 18:57:14 +00:00
ResourceNames ( "nodes" , args ... ) .
SingleResourceType ( ) .
Flatten ( )
if len ( o . Selector ) > 0 {
builder = builder . LabelSelectorParam ( o . Selector ) .
ResourceTypes ( "nodes" )
}
r := builder . Do ( )
if err = r . Err ( ) ; err != nil {
return err
}
return r . Visit ( func ( info * resource . Info , err error ) error {
if err != nil {
return err
}
2018-07-18 14:47:22 +00:00
if info . Mapping . Resource . GroupResource ( ) != ( schema . GroupResource { Group : "" , Resource : "nodes" } ) {
2018-01-09 18:57:14 +00:00
return fmt . Errorf ( "error: expected resource of type node, got %q" , info . Mapping . Resource )
}
o . nodeInfos = append ( o . nodeInfos , info )
return nil
} )
}
// RunDrain runs the 'drain' command
func ( o * DrainOptions ) RunDrain ( ) error {
if err := o . RunCordonOrUncordon ( true ) ; err != nil {
return err
}
2018-07-18 14:47:22 +00:00
printObj , err := o . ToPrinter ( "drained" )
if err != nil {
return err
}
2018-01-09 18:57:14 +00:00
drainedNodes := sets . NewString ( )
var fatal error
for _ , info := range o . nodeInfos {
var err error
if ! o . DryRun {
err = o . deleteOrEvictPodsSimple ( info )
}
if err == nil || o . DryRun {
drainedNodes . Insert ( info . Name )
2018-07-18 14:47:22 +00:00
printObj ( info . Object , o . Out )
2018-01-09 18:57:14 +00:00
} else {
fmt . Fprintf ( o . ErrOut , "error: unable to drain node %q, aborting command...\n\n" , info . Name )
remainingNodes := [ ] string { }
fatal = err
for _ , remainingInfo := range o . nodeInfos {
if drainedNodes . Has ( remainingInfo . Name ) {
continue
}
remainingNodes = append ( remainingNodes , remainingInfo . Name )
}
if len ( remainingNodes ) > 0 {
fmt . Fprintf ( o . ErrOut , "There are pending nodes to be drained:\n" )
for _ , nodeName := range remainingNodes {
fmt . Fprintf ( o . ErrOut , " %s\n" , nodeName )
}
}
break
}
}
return fatal
}
// deleteOrEvictPodsSimple removes the eligible pods from one node. If removal
// fails, it lists the pods still selected for deletion on ErrOut and returns
// the removal error; a failure while re-listing is returned instead.
func (o *DrainOptions) deleteOrEvictPodsSimple(nodeInfo *resource.Info) error {
	targets, err := o.getPodsForDeletion(nodeInfo)
	if err != nil {
		return err
	}

	removeErr := o.deleteOrEvictPods(targets)
	if removeErr == nil {
		return nil
	}

	remaining, listErr := o.getPodsForDeletion(nodeInfo)
	if listErr != nil {
		return listErr
	}

	fmt.Fprintf(o.ErrOut, "There are pending pods in node %q when an error occurred: %v\n", nodeInfo.Name, removeErr)
	for i := range remaining {
		fmt.Fprintf(o.ErrOut, "%s/%s\n", "pod", remaining[i].Name)
	}
	return removeErr
}
2018-03-06 22:33:18 +00:00
func ( o * DrainOptions ) getPodController ( pod corev1 . Pod ) * metav1 . OwnerReference {
return metav1 . GetControllerOf ( & pod )
2018-01-09 18:57:14 +00:00
}
func ( o * DrainOptions ) unreplicatedFilter ( pod corev1 . Pod ) ( bool , * warning , * fatal ) {
// any finished pod can be removed
if pod . Status . Phase == corev1 . PodSucceeded || pod . Status . Phase == corev1 . PodFailed {
return true , nil , nil
}
2018-03-06 22:33:18 +00:00
controllerRef := o . getPodController ( pod )
2018-01-09 18:57:14 +00:00
if controllerRef != nil {
return true , nil , nil
}
2018-03-06 22:33:18 +00:00
if o . Force {
return true , & warning { kUnmanagedWarning } , nil
2018-01-09 18:57:14 +00:00
}
2018-03-06 22:33:18 +00:00
return false , nil , & fatal { kUnmanagedFatal }
2018-01-09 18:57:14 +00:00
}
func ( o * DrainOptions ) daemonsetFilter ( pod corev1 . Pod ) ( bool , * warning , * fatal ) {
// Note that we return false in cases where the pod is DaemonSet managed,
// regardless of flags. We never delete them, the only question is whether
// their presence constitutes an error.
//
// The exception is for pods that are orphaned (the referencing
// management resource - including DaemonSet - is not found).
// Such pods will be deleted if --force is used.
2018-03-06 22:33:18 +00:00
controllerRef := o . getPodController ( pod )
2018-01-09 18:57:14 +00:00
if controllerRef == nil || controllerRef . Kind != "DaemonSet" {
return true , nil , nil
}
2018-03-06 22:33:18 +00:00
if _ , err := o . client . ExtensionsV1beta1 ( ) . DaemonSets ( pod . Namespace ) . Get ( controllerRef . Name , metav1 . GetOptions { } ) ; err != nil {
// remove orphaned pods with a warning if --force is used
if apierrors . IsNotFound ( err ) && o . Force {
return true , & warning { err . Error ( ) } , nil
}
2018-01-09 18:57:14 +00:00
return false , nil , & fatal { err . Error ( ) }
}
2018-03-06 22:33:18 +00:00
2018-01-09 18:57:14 +00:00
if ! o . IgnoreDaemonsets {
return false , nil , & fatal { kDaemonsetFatal }
}
2018-03-06 22:33:18 +00:00
2018-01-09 18:57:14 +00:00
return false , & warning { kDaemonsetWarning } , nil
}
// mirrorPodFilter excludes pods carrying the mirror-pod annotation; it never
// produces a warning or a fatal error.
func mirrorPodFilter(pod corev1.Pod) (bool, *warning, *fatal) {
	_, isMirror := pod.ObjectMeta.Annotations[corev1.MirrorPodAnnotationKey]
	return !isMirror, nil, nil
}
// hasLocalStorage reports whether any of the pod's volumes is an emptyDir.
func hasLocalStorage(pod corev1.Pod) bool {
	volumes := pod.Spec.Volumes
	for i := range volumes {
		if volumes[i].EmptyDir != nil {
			return true
		}
	}
	return false
}
// localStorageFilter lets pods without emptyDir volumes pass silently. Pods
// with local storage pass with a warning when --delete-local-data is set and
// are fatal otherwise.
func (o *DrainOptions) localStorageFilter(pod corev1.Pod) (bool, *warning, *fatal) {
	switch {
	case !hasLocalStorage(pod):
		return true, nil, nil
	case o.DeleteLocalData:
		return true, &warning{kLocalStorageWarning}, nil
	default:
		return false, nil, &fatal{kLocalStorageFatal}
	}
}
// podStatuses maps a status message to the list of pod names having that status.
type podStatuses map[string][]string

// Message renders the statuses as "status: pod1, pod2; other status: pod3".
// Statuses are emitted in sorted key order so that the same input always
// yields the same message (Go map iteration order is randomized). An empty
// map yields the empty string.
func (ps podStatuses) Message() string {
	keys := make([]string, 0, len(ps))
	for key := range ps {
		keys = append(keys, key)
	}
	sort.Strings(keys)

	msgs := make([]string, 0, len(keys))
	for _, key := range keys {
		msgs = append(msgs, fmt.Sprintf("%s: %s", key, strings.Join(ps[key], ", ")))
	}
	return strings.Join(msgs, "; ")
}
// getPodsForDeletion receives resource info for a node, and returns all the pods from the given node that we
// are planning on deleting. If there are any pods preventing us from deleting, we return that list in an error.
func ( o * DrainOptions ) getPodsForDeletion ( nodeInfo * resource . Info ) ( pods [ ] corev1 . Pod , err error ) {
2018-03-06 22:33:18 +00:00
labelSelector , err := labels . Parse ( o . PodSelector )
if err != nil {
return pods , err
}
podList , err := o . client . CoreV1 ( ) . Pods ( metav1 . NamespaceAll ) . List ( metav1 . ListOptions {
LabelSelector : labelSelector . String ( ) ,
2018-01-09 18:57:14 +00:00
FieldSelector : fields . SelectorFromSet ( fields . Set { "spec.nodeName" : nodeInfo . Name } ) . String ( ) } )
if err != nil {
return pods , err
}
ws := podStatuses { }
fs := podStatuses { }
for _ , pod := range podList . Items {
podOk := true
2018-03-06 22:33:18 +00:00
for _ , filt := range [ ] podFilter { o . daemonsetFilter , mirrorPodFilter , o . localStorageFilter , o . unreplicatedFilter } {
2018-01-09 18:57:14 +00:00
filterOk , w , f := filt ( pod )
podOk = podOk && filterOk
if w != nil {
ws [ w . string ] = append ( ws [ w . string ] , pod . Name )
}
if f != nil {
fs [ f . string ] = append ( fs [ f . string ] , pod . Name )
}
2018-03-06 22:33:18 +00:00
// short-circuit as soon as pod not ok
// at that point, there is no reason to run pod
// through any additional filters
if ! podOk {
break
}
2018-01-09 18:57:14 +00:00
}
if podOk {
pods = append ( pods , pod )
}
}
if len ( fs ) > 0 {
return [ ] corev1 . Pod { } , errors . New ( fs . Message ( ) )
}
if len ( ws ) > 0 {
fmt . Fprintf ( o . ErrOut , "WARNING: %s\n" , ws . Message ( ) )
}
return pods , nil
}
func ( o * DrainOptions ) deletePod ( pod corev1 . Pod ) error {
deleteOptions := & metav1 . DeleteOptions { }
if o . GracePeriodSeconds >= 0 {
gracePeriodSeconds := int64 ( o . GracePeriodSeconds )
deleteOptions . GracePeriodSeconds = & gracePeriodSeconds
}
2018-03-06 22:33:18 +00:00
return o . client . CoreV1 ( ) . Pods ( pod . Namespace ) . Delete ( pod . Name , deleteOptions )
2018-01-09 18:57:14 +00:00
}
func ( o * DrainOptions ) evictPod ( pod corev1 . Pod , policyGroupVersion string ) error {
deleteOptions := & metav1 . DeleteOptions { }
if o . GracePeriodSeconds >= 0 {
gracePeriodSeconds := int64 ( o . GracePeriodSeconds )
deleteOptions . GracePeriodSeconds = & gracePeriodSeconds
}
eviction := & policyv1beta1 . Eviction {
TypeMeta : metav1 . TypeMeta {
APIVersion : policyGroupVersion ,
Kind : EvictionKind ,
} ,
ObjectMeta : metav1 . ObjectMeta {
Name : pod . Name ,
Namespace : pod . Namespace ,
} ,
DeleteOptions : deleteOptions ,
}
// Remember to change change the URL manipulation func when Evction's version change
2018-03-06 22:33:18 +00:00
return o . client . PolicyV1beta1 ( ) . Evictions ( eviction . Namespace ) . Evict ( eviction )
2018-01-09 18:57:14 +00:00
}
// deleteOrEvictPods deletes or evicts the pods on the api server
func ( o * DrainOptions ) deleteOrEvictPods ( pods [ ] corev1 . Pod ) error {
if len ( pods ) == 0 {
return nil
}
policyGroupVersion , err := SupportEviction ( o . client )
if err != nil {
return err
}
getPodFn := func ( namespace , name string ) ( * corev1 . Pod , error ) {
2018-03-06 22:33:18 +00:00
return o . client . CoreV1 ( ) . Pods ( namespace ) . Get ( name , metav1 . GetOptions { } )
2018-01-09 18:57:14 +00:00
}
if len ( policyGroupVersion ) > 0 {
return o . evictPods ( pods , policyGroupVersion , getPodFn )
} else {
return o . deletePods ( pods , getPodFn )
}
}
func ( o * DrainOptions ) evictPods ( pods [ ] corev1 . Pod , policyGroupVersion string , getPodFn func ( namespace , name string ) ( * corev1 . Pod , error ) ) error {
doneCh := make ( chan bool , len ( pods ) )
errCh := make ( chan error , 1 )
for _ , pod := range pods {
go func ( pod corev1 . Pod , doneCh chan bool , errCh chan error ) {
var err error
for {
err = o . evictPod ( pod , policyGroupVersion )
if err == nil {
break
} else if apierrors . IsNotFound ( err ) {
doneCh <- true
return
} else if apierrors . IsTooManyRequests ( err ) {
time . Sleep ( 5 * time . Second )
} else {
errCh <- fmt . Errorf ( "error when evicting pod %q: %v" , pod . Name , err )
return
}
}
podArray := [ ] corev1 . Pod { pod }
2018-07-18 14:47:22 +00:00
_ , err = o . waitForDelete ( podArray , 1 * time . Second , time . Duration ( math . MaxInt64 ) , true , getPodFn )
2018-01-09 18:57:14 +00:00
if err == nil {
doneCh <- true
} else {
errCh <- fmt . Errorf ( "error when waiting for pod %q terminating: %v" , pod . Name , err )
}
} ( pod , doneCh , errCh )
}
doneCount := 0
// 0 timeout means infinite, we use MaxInt64 to represent it.
var globalTimeout time . Duration
if o . Timeout == 0 {
globalTimeout = time . Duration ( math . MaxInt64 )
} else {
globalTimeout = o . Timeout
}
for {
select {
case err := <- errCh :
return err
case <- doneCh :
doneCount ++
if doneCount == len ( pods ) {
return nil
}
case <- time . After ( globalTimeout ) :
return fmt . Errorf ( "Drain did not complete within %v" , globalTimeout )
}
}
}
func ( o * DrainOptions ) deletePods ( pods [ ] corev1 . Pod , getPodFn func ( namespace , name string ) ( * corev1 . Pod , error ) ) error {
// 0 timeout means infinite, we use MaxInt64 to represent it.
var globalTimeout time . Duration
if o . Timeout == 0 {
globalTimeout = time . Duration ( math . MaxInt64 )
} else {
globalTimeout = o . Timeout
}
for _ , pod := range pods {
err := o . deletePod ( pod )
if err != nil && ! apierrors . IsNotFound ( err ) {
return err
}
}
2018-07-18 14:47:22 +00:00
_ , err := o . waitForDelete ( pods , 1 * time . Second , globalTimeout , false , getPodFn )
2018-01-09 18:57:14 +00:00
return err
}
func ( o * DrainOptions ) waitForDelete ( pods [ ] corev1 . Pod , interval , timeout time . Duration , usingEviction bool , getPodFn func ( string , string ) ( * corev1 . Pod , error ) ) ( [ ] corev1 . Pod , error ) {
var verbStr string
if usingEviction {
verbStr = "evicted"
} else {
verbStr = "deleted"
}
2018-07-18 14:47:22 +00:00
printObj , err := o . ToPrinter ( verbStr )
if err != nil {
return pods , err
}
err = wait . PollImmediate ( interval , timeout , func ( ) ( bool , error ) {
2018-01-09 18:57:14 +00:00
pendingPods := [ ] corev1 . Pod { }
for i , pod := range pods {
p , err := getPodFn ( pod . Namespace , pod . Name )
if apierrors . IsNotFound ( err ) || ( p != nil && p . ObjectMeta . UID != pod . ObjectMeta . UID ) {
2018-07-18 14:47:22 +00:00
printObj ( & pod , o . Out )
2018-01-09 18:57:14 +00:00
continue
} else if err != nil {
return false , err
} else {
pendingPods = append ( pendingPods , pods [ i ] )
}
}
pods = pendingPods
if len ( pendingPods ) > 0 {
return false , nil
}
return true , nil
} )
return pods , err
}
// SupportEviction uses the Discovery API to find out whether the server
// supports the eviction subresource. If it does, the preferred group version
// of the "policy" group is returned; otherwise the empty string is returned.
func SupportEviction(clientset kubernetes.Interface) (string, error) {
	dc := clientset.Discovery()

	groups, err := dc.ServerGroups()
	if err != nil {
		return "", err
	}

	policyGroupVersion := ""
	hasPolicyGroup := false
	for i := range groups.Groups {
		group := groups.Groups[i]
		if group.Name != "policy" {
			continue
		}
		hasPolicyGroup = true
		policyGroupVersion = group.PreferredVersion.GroupVersion
		break
	}
	if !hasPolicyGroup {
		return "", nil
	}

	// The eviction subresource is looked up among the core "v1" resources.
	coreResources, err := dc.ServerResourcesForGroupVersion("v1")
	if err != nil {
		return "", err
	}
	for i := range coreResources.APIResources {
		candidate := coreResources.APIResources[i]
		if candidate.Name == EvictionSubresource && candidate.Kind == EvictionKind {
			return policyGroupVersion, nil
		}
	}
	return "", nil
}
// RunCordonOrUncordon runs either Cordon or Uncordon. The desired value for
// "Unschedulable" is passed as the first arg.
func ( o * DrainOptions ) RunCordonOrUncordon ( desired bool ) error {
cordonOrUncordon := "cordon"
if ! desired {
cordonOrUncordon = "un" + cordonOrUncordon
}
for _ , nodeInfo := range o . nodeInfos {
if nodeInfo . Mapping . GroupVersionKind . Kind == "Node" {
2018-07-18 14:47:22 +00:00
obj , err := legacyscheme . Scheme . ConvertToVersion ( nodeInfo . Object , nodeInfo . Mapping . GroupVersionKind . GroupVersion ( ) )
2018-01-09 18:57:14 +00:00
if err != nil {
fmt . Printf ( "error: unable to %s node %q: %v" , cordonOrUncordon , nodeInfo . Name , err )
continue
}
oldData , err := json . Marshal ( obj )
if err != nil {
fmt . Printf ( "error: unable to %s node %q: %v" , cordonOrUncordon , nodeInfo . Name , err )
continue
}
node , ok := obj . ( * corev1 . Node )
if ! ok {
fmt . Fprintf ( o . ErrOut , "error: unable to %s node %q: unexpected Type%T, expected Node" , cordonOrUncordon , nodeInfo . Name , obj )
continue
}
unsched := node . Spec . Unschedulable
if unsched == desired {
2018-07-18 14:47:22 +00:00
printObj , err := o . ToPrinter ( already ( desired ) )
if err != nil {
fmt . Printf ( "error: %v" , err )
continue
}
printObj ( cmdutil . AsDefaultVersionedOrOriginal ( nodeInfo . Object , nodeInfo . Mapping ) , o . Out )
2018-01-09 18:57:14 +00:00
} else {
if ! o . DryRun {
helper := resource . NewHelper ( o . restClient , nodeInfo . Mapping )
node . Spec . Unschedulable = desired
newData , err := json . Marshal ( obj )
if err != nil {
fmt . Fprintf ( o . ErrOut , "error: unable to %s node %q: %v" , cordonOrUncordon , nodeInfo . Name , err )
continue
}
patchBytes , err := strategicpatch . CreateTwoWayMergePatch ( oldData , newData , obj )
if err != nil {
fmt . Printf ( "error: unable to %s node %q: %v" , cordonOrUncordon , nodeInfo . Name , err )
continue
}
2018-07-18 14:47:22 +00:00
_ , err = helper . Patch ( o . Namespace , nodeInfo . Name , types . StrategicMergePatchType , patchBytes )
2018-01-09 18:57:14 +00:00
if err != nil {
fmt . Printf ( "error: unable to %s node %q: %v" , cordonOrUncordon , nodeInfo . Name , err )
continue
}
}
2018-07-18 14:47:22 +00:00
printObj , err := o . ToPrinter ( changed ( desired ) )
if err != nil {
fmt . Fprintf ( o . ErrOut , "%v" , err )
continue
}
printObj ( cmdutil . AsDefaultVersionedOrOriginal ( nodeInfo . Object , nodeInfo . Mapping ) , o . Out )
2018-01-09 18:57:14 +00:00
}
} else {
2018-07-18 14:47:22 +00:00
printObj , err := o . ToPrinter ( "skipped" )
if err != nil {
fmt . Fprintf ( o . ErrOut , "%v" , err )
continue
}
printObj ( cmdutil . AsDefaultVersionedOrOriginal ( nodeInfo . Object , nodeInfo . Mapping ) , o . Out )
2018-01-09 18:57:14 +00:00
}
}
return nil
}
// already returns the operation label used when a node is already in the
// desired state: "already cordoned" when desired is true, "already uncordoned"
// otherwise.
func already(desired bool) string {
	label := "already uncordoned"
	if desired {
		label = "already cordoned"
	}
	return label
}
// changed returns the operation label used when a node's state was changed:
// "cordoned" when desired is true, "uncordoned" otherwise.
func changed(desired bool) string {
	label := "uncordoned"
	if desired {
		label = "cordoned"
	}
	return label
}