mirror of
https://github.com/ceph/ceph-csi.git
synced 2025-01-24 21:59:29 +00:00
396 lines
14 KiB
Go
396 lines
14 KiB
Go
|
/*
|
||
|
Copyright 2017 The Kubernetes Authors.
|
||
|
|
||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||
|
you may not use this file except in compliance with the License.
|
||
|
You may obtain a copy of the License at
|
||
|
|
||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||
|
|
||
|
Unless required by applicable law or agreed to in writing, software
|
||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||
|
See the License for the specific language governing permissions and
|
||
|
limitations under the License.
|
||
|
*/
|
||
|
|
||
|
package scheduler
|
||
|
|
||
|
import (
|
||
|
"fmt"
|
||
|
"testing"
|
||
|
"time"
|
||
|
|
||
|
"k8s.io/api/core/v1"
|
||
|
"k8s.io/apimachinery/pkg/api/errors"
|
||
|
"k8s.io/apimachinery/pkg/api/resource"
|
||
|
metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
|
||
|
"k8s.io/apimachinery/pkg/util/uuid"
|
||
|
"k8s.io/apimachinery/pkg/util/wait"
|
||
|
"k8s.io/client-go/informers"
|
||
|
clientset "k8s.io/client-go/kubernetes"
|
||
|
clientv1core "k8s.io/client-go/kubernetes/typed/core/v1"
|
||
|
corelisters "k8s.io/client-go/listers/core/v1"
|
||
|
restclient "k8s.io/client-go/rest"
|
||
|
"k8s.io/client-go/tools/record"
|
||
|
"k8s.io/kubernetes/pkg/api/legacyscheme"
|
||
|
podutil "k8s.io/kubernetes/pkg/api/v1/pod"
|
||
|
"k8s.io/kubernetes/plugin/pkg/scheduler"
|
||
|
_ "k8s.io/kubernetes/plugin/pkg/scheduler/algorithmprovider"
|
||
|
"k8s.io/kubernetes/plugin/pkg/scheduler/factory"
|
||
|
"k8s.io/kubernetes/test/integration/framework"
|
||
|
|
||
|
"net/http/httptest"
|
||
|
)
|
||
|
|
||
|
type TestContext struct {
|
||
|
closeFn framework.CloseFunc
|
||
|
httpServer *httptest.Server
|
||
|
ns *v1.Namespace
|
||
|
clientSet *clientset.Clientset
|
||
|
informerFactory informers.SharedInformerFactory
|
||
|
schedulerConfigFactory scheduler.Configurator
|
||
|
schedulerConfig *scheduler.Config
|
||
|
scheduler *scheduler.Scheduler
|
||
|
}
|
||
|
|
||
|
// initTest initializes a test environment and creates a scheduler with default
|
||
|
// configuration.
|
||
|
func initTest(t *testing.T, nsPrefix string) *TestContext {
|
||
|
var context TestContext
|
||
|
masterConfig := framework.NewIntegrationTestMasterConfig()
|
||
|
_, context.httpServer, context.closeFn = framework.RunAMaster(masterConfig)
|
||
|
|
||
|
context.ns = framework.CreateTestingNamespace(nsPrefix+string(uuid.NewUUID()), context.httpServer, t)
|
||
|
|
||
|
context.clientSet = clientset.NewForConfigOrDie(&restclient.Config{Host: context.httpServer.URL})
|
||
|
context.informerFactory = informers.NewSharedInformerFactory(context.clientSet, 0)
|
||
|
podInformer := factory.NewPodInformer(context.clientSet, 12*time.Hour, v1.DefaultSchedulerName)
|
||
|
context.schedulerConfigFactory = factory.NewConfigFactory(
|
||
|
v1.DefaultSchedulerName,
|
||
|
context.clientSet,
|
||
|
context.informerFactory.Core().V1().Nodes(),
|
||
|
podInformer,
|
||
|
context.informerFactory.Core().V1().PersistentVolumes(),
|
||
|
context.informerFactory.Core().V1().PersistentVolumeClaims(),
|
||
|
context.informerFactory.Core().V1().ReplicationControllers(),
|
||
|
context.informerFactory.Extensions().V1beta1().ReplicaSets(),
|
||
|
context.informerFactory.Apps().V1beta1().StatefulSets(),
|
||
|
context.informerFactory.Core().V1().Services(),
|
||
|
context.informerFactory.Policy().V1beta1().PodDisruptionBudgets(),
|
||
|
context.informerFactory.Storage().V1().StorageClasses(),
|
||
|
v1.DefaultHardPodAffinitySymmetricWeight,
|
||
|
true,
|
||
|
)
|
||
|
var err error
|
||
|
context.schedulerConfig, err = context.schedulerConfigFactory.Create()
|
||
|
if err != nil {
|
||
|
t.Fatalf("Couldn't create scheduler config: %v", err)
|
||
|
}
|
||
|
eventBroadcaster := record.NewBroadcaster()
|
||
|
context.schedulerConfig.Recorder = eventBroadcaster.NewRecorder(legacyscheme.Scheme, v1.EventSource{Component: v1.DefaultSchedulerName})
|
||
|
eventBroadcaster.StartRecordingToSink(&clientv1core.EventSinkImpl{Interface: clientv1core.New(context.clientSet.CoreV1().RESTClient()).Events("")})
|
||
|
go podInformer.Informer().Run(context.schedulerConfig.StopEverything)
|
||
|
context.informerFactory.Start(context.schedulerConfig.StopEverything)
|
||
|
context.scheduler, err = scheduler.NewFromConfigurator(&scheduler.FakeConfigurator{Config: context.schedulerConfig}, nil...)
|
||
|
if err != nil {
|
||
|
t.Fatalf("Couldn't create scheduler: %v", err)
|
||
|
}
|
||
|
context.scheduler.Run()
|
||
|
return &context
|
||
|
}
|
||
|
|
||
|
// cleanupTest deletes the scheduler and the test namespace. It should be called
|
||
|
// at the end of a test.
|
||
|
func cleanupTest(t *testing.T, context *TestContext) {
|
||
|
// Kill the scheduler.
|
||
|
close(context.schedulerConfig.StopEverything)
|
||
|
// Cleanup nodes.
|
||
|
context.clientSet.CoreV1().Nodes().DeleteCollection(nil, metav1.ListOptions{})
|
||
|
framework.DeleteTestingNamespace(context.ns, context.httpServer, t)
|
||
|
context.closeFn()
|
||
|
}
|
||
|
|
||
|
// waitForReflection waits till the passFunc confirms that the object it expects
|
||
|
// to see is in the store. Used to observe reflected events.
|
||
|
func waitForReflection(t *testing.T, nodeLister corelisters.NodeLister, key string, passFunc func(n interface{}) bool) error {
|
||
|
nodes := []*v1.Node{}
|
||
|
err := wait.Poll(time.Millisecond*100, wait.ForeverTestTimeout, func() (bool, error) {
|
||
|
n, err := nodeLister.Get(key)
|
||
|
|
||
|
switch {
|
||
|
case err == nil && passFunc(n):
|
||
|
return true, nil
|
||
|
case errors.IsNotFound(err):
|
||
|
nodes = append(nodes, nil)
|
||
|
case err != nil:
|
||
|
t.Errorf("Unexpected error: %v", err)
|
||
|
default:
|
||
|
nodes = append(nodes, n)
|
||
|
}
|
||
|
|
||
|
return false, nil
|
||
|
})
|
||
|
if err != nil {
|
||
|
t.Logf("Logging consecutive node versions received from store:")
|
||
|
for i, n := range nodes {
|
||
|
t.Logf("%d: %#v", i, n)
|
||
|
}
|
||
|
}
|
||
|
return err
|
||
|
}
|
||
|
|
||
|
// nodeHasLabels returns a function that checks if a node has all the given labels.
|
||
|
func nodeHasLabels(cs clientset.Interface, nodeName string, labels map[string]string) wait.ConditionFunc {
|
||
|
return func() (bool, error) {
|
||
|
node, err := cs.CoreV1().Nodes().Get(nodeName, metav1.GetOptions{})
|
||
|
if errors.IsNotFound(err) {
|
||
|
return false, nil
|
||
|
}
|
||
|
if err != nil {
|
||
|
// This could be a connection error so we want to retry.
|
||
|
return false, nil
|
||
|
}
|
||
|
for k, v := range labels {
|
||
|
if node.Labels == nil || node.Labels[k] != v {
|
||
|
return false, nil
|
||
|
}
|
||
|
}
|
||
|
return true, nil
|
||
|
}
|
||
|
}
|
||
|
|
||
|
// waitForNodeLabels waits for the given node to have all the given labels.
|
||
|
func waitForNodeLabels(cs clientset.Interface, nodeName string, labels map[string]string) error {
|
||
|
return wait.Poll(time.Millisecond*100, wait.ForeverTestTimeout, nodeHasLabels(cs, nodeName, labels))
|
||
|
}
|
||
|
|
||
|
// createNode creates a node with the given resource list and
|
||
|
// returns a pointer and error status. If 'res' is nil, a predefined amount of
|
||
|
// resource will be used.
|
||
|
func createNode(cs clientset.Interface, name string, res *v1.ResourceList) (*v1.Node, error) {
|
||
|
// if resource is nil, we use a default amount of resources for the node.
|
||
|
if res == nil {
|
||
|
res = &v1.ResourceList{
|
||
|
v1.ResourcePods: *resource.NewQuantity(32, resource.DecimalSI),
|
||
|
}
|
||
|
}
|
||
|
n := &v1.Node{
|
||
|
ObjectMeta: metav1.ObjectMeta{Name: name},
|
||
|
Spec: v1.NodeSpec{Unschedulable: false},
|
||
|
Status: v1.NodeStatus{
|
||
|
Capacity: *res,
|
||
|
},
|
||
|
}
|
||
|
return cs.CoreV1().Nodes().Create(n)
|
||
|
}
|
||
|
|
||
|
// createNodes creates `numNodes` nodes. The created node names will be in the
|
||
|
// form of "`prefix`-X" where X is an ordinal.
|
||
|
func createNodes(cs clientset.Interface, prefix string, res *v1.ResourceList, numNodes int) ([]*v1.Node, error) {
|
||
|
nodes := make([]*v1.Node, numNodes)
|
||
|
for i := 0; i < numNodes; i++ {
|
||
|
nodeName := fmt.Sprintf("%v-%d", prefix, i)
|
||
|
node, err := createNode(cs, nodeName, res)
|
||
|
if err != nil {
|
||
|
return nodes[:], err
|
||
|
}
|
||
|
nodes[i] = node
|
||
|
}
|
||
|
return nodes[:], nil
|
||
|
}
|
||
|
|
||
|
type pausePodConfig struct {
|
||
|
Name string
|
||
|
Namespace string
|
||
|
Affinity *v1.Affinity
|
||
|
Annotations, Labels, NodeSelector map[string]string
|
||
|
Resources *v1.ResourceRequirements
|
||
|
Tolerations []v1.Toleration
|
||
|
NodeName string
|
||
|
SchedulerName string
|
||
|
Priority *int32
|
||
|
}
|
||
|
|
||
|
// initPausePod initializes a pod API object from the given config. It is used
|
||
|
// mainly in pod creation process.
|
||
|
func initPausePod(cs clientset.Interface, conf *pausePodConfig) *v1.Pod {
|
||
|
pod := &v1.Pod{
|
||
|
ObjectMeta: metav1.ObjectMeta{
|
||
|
Name: conf.Name,
|
||
|
Namespace: conf.Namespace,
|
||
|
Labels: conf.Labels,
|
||
|
Annotations: conf.Annotations,
|
||
|
},
|
||
|
Spec: v1.PodSpec{
|
||
|
NodeSelector: conf.NodeSelector,
|
||
|
Affinity: conf.Affinity,
|
||
|
Containers: []v1.Container{
|
||
|
{
|
||
|
Name: conf.Name,
|
||
|
Image: framework.GetPauseImageName(cs),
|
||
|
},
|
||
|
},
|
||
|
Tolerations: conf.Tolerations,
|
||
|
NodeName: conf.NodeName,
|
||
|
SchedulerName: conf.SchedulerName,
|
||
|
Priority: conf.Priority,
|
||
|
},
|
||
|
}
|
||
|
if conf.Resources != nil {
|
||
|
pod.Spec.Containers[0].Resources = *conf.Resources
|
||
|
}
|
||
|
return pod
|
||
|
}
|
||
|
|
||
|
// createPausePod creates a pod with "Pause" image and the given config and
|
||
|
// return its pointer and error status.
|
||
|
func createPausePod(cs clientset.Interface, p *v1.Pod) (*v1.Pod, error) {
|
||
|
return cs.CoreV1().Pods(p.Namespace).Create(p)
|
||
|
}
|
||
|
|
||
|
// createPausePodWithResource creates a pod with "Pause" image and the given
|
||
|
// resources and returns its pointer and error status. The resource list can be
|
||
|
// nil.
|
||
|
func createPausePodWithResource(cs clientset.Interface, podName string, nsName string, res *v1.ResourceList) (*v1.Pod, error) {
|
||
|
var conf pausePodConfig
|
||
|
if res == nil {
|
||
|
conf = pausePodConfig{
|
||
|
Name: podName,
|
||
|
Namespace: nsName,
|
||
|
}
|
||
|
} else {
|
||
|
conf = pausePodConfig{
|
||
|
Name: podName,
|
||
|
Namespace: nsName,
|
||
|
Resources: &v1.ResourceRequirements{
|
||
|
Requests: *res,
|
||
|
},
|
||
|
}
|
||
|
}
|
||
|
return createPausePod(cs, initPausePod(cs, &conf))
|
||
|
}
|
||
|
|
||
|
// runPausePod creates a pod with "Pause" image and the given config and waits
|
||
|
// until it is scheduled. It returns its pointer and error status.
|
||
|
func runPausePod(cs clientset.Interface, pod *v1.Pod) (*v1.Pod, error) {
|
||
|
pod, err := cs.CoreV1().Pods(pod.Namespace).Create(pod)
|
||
|
if err != nil {
|
||
|
return nil, fmt.Errorf("Error creating pause pod: %v", err)
|
||
|
}
|
||
|
if err = waitForPodToSchedule(cs, pod); err != nil {
|
||
|
return pod, fmt.Errorf("Pod %v didn't schedule successfully. Error: %v", pod.Name, err)
|
||
|
}
|
||
|
if pod, err = cs.CoreV1().Pods(pod.Namespace).Get(pod.Name, metav1.GetOptions{}); err != nil {
|
||
|
return pod, fmt.Errorf("Error getting pod %v info: %v", pod.Name, err)
|
||
|
}
|
||
|
return pod, nil
|
||
|
}
|
||
|
|
||
|
// podDeleted returns true if a pod is not found in the given namespace.
|
||
|
func podDeleted(c clientset.Interface, podNamespace, podName string) wait.ConditionFunc {
|
||
|
return func() (bool, error) {
|
||
|
pod, err := c.CoreV1().Pods(podNamespace).Get(podName, metav1.GetOptions{})
|
||
|
if errors.IsNotFound(err) {
|
||
|
return true, nil
|
||
|
}
|
||
|
if pod.DeletionTimestamp != nil {
|
||
|
return true, nil
|
||
|
}
|
||
|
return false, nil
|
||
|
}
|
||
|
}
|
||
|
|
||
|
// podIsGettingEvicted returns true if the pod's deletion timestamp is set.
|
||
|
func podIsGettingEvicted(c clientset.Interface, podNamespace, podName string) wait.ConditionFunc {
|
||
|
return func() (bool, error) {
|
||
|
pod, err := c.CoreV1().Pods(podNamespace).Get(podName, metav1.GetOptions{})
|
||
|
if err != nil {
|
||
|
return false, err
|
||
|
}
|
||
|
if pod.DeletionTimestamp != nil {
|
||
|
return true, nil
|
||
|
}
|
||
|
return false, nil
|
||
|
}
|
||
|
}
|
||
|
|
||
|
// podScheduled returns true if a node is assigned to the given pod.
|
||
|
func podScheduled(c clientset.Interface, podNamespace, podName string) wait.ConditionFunc {
|
||
|
return func() (bool, error) {
|
||
|
pod, err := c.CoreV1().Pods(podNamespace).Get(podName, metav1.GetOptions{})
|
||
|
if errors.IsNotFound(err) {
|
||
|
return false, nil
|
||
|
}
|
||
|
if err != nil {
|
||
|
// This could be a connection error so we want to retry.
|
||
|
return false, nil
|
||
|
}
|
||
|
if pod.Spec.NodeName == "" {
|
||
|
return false, nil
|
||
|
}
|
||
|
return true, nil
|
||
|
}
|
||
|
}
|
||
|
|
||
|
// podUnschedulable returns a condition function that returns true if the given pod
|
||
|
// gets unschedulable status.
|
||
|
func podUnschedulable(c clientset.Interface, podNamespace, podName string) wait.ConditionFunc {
|
||
|
return func() (bool, error) {
|
||
|
pod, err := c.CoreV1().Pods(podNamespace).Get(podName, metav1.GetOptions{})
|
||
|
if errors.IsNotFound(err) {
|
||
|
return false, nil
|
||
|
}
|
||
|
if err != nil {
|
||
|
// This could be a connection error so we want to retry.
|
||
|
return false, nil
|
||
|
}
|
||
|
_, cond := podutil.GetPodCondition(&pod.Status, v1.PodScheduled)
|
||
|
return cond != nil && cond.Status == v1.ConditionFalse && cond.Reason == v1.PodReasonUnschedulable, nil
|
||
|
}
|
||
|
}
|
||
|
|
||
|
// waitForPodToScheduleWithTimeout waits for a pod to get scheduled and returns
|
||
|
// an error if it does not scheduled within the given timeout.
|
||
|
func waitForPodToScheduleWithTimeout(cs clientset.Interface, pod *v1.Pod, timeout time.Duration) error {
|
||
|
return wait.Poll(100*time.Millisecond, timeout, podScheduled(cs, pod.Namespace, pod.Name))
|
||
|
}
|
||
|
|
||
|
// waitForPodToSchedule waits for a pod to get scheduled and returns an error if
|
||
|
// it does not get scheduled within the timeout duration (30 seconds).
|
||
|
func waitForPodToSchedule(cs clientset.Interface, pod *v1.Pod) error {
|
||
|
return waitForPodToScheduleWithTimeout(cs, pod, 30*time.Second)
|
||
|
}
|
||
|
|
||
|
// deletePod deletes the given pod in the given namespace.
|
||
|
func deletePod(cs clientset.Interface, podName string, nsName string) error {
|
||
|
return cs.CoreV1().Pods(nsName).Delete(podName, metav1.NewDeleteOptions(0))
|
||
|
}
|
||
|
|
||
|
// cleanupPods deletes the given pods and waits for them to be actually deleted.
|
||
|
func cleanupPods(cs clientset.Interface, t *testing.T, pods []*v1.Pod) {
|
||
|
for _, p := range pods {
|
||
|
err := cs.CoreV1().Pods(p.Namespace).Delete(p.Name, metav1.NewDeleteOptions(0))
|
||
|
if err != nil && !errors.IsNotFound(err) {
|
||
|
t.Errorf("error while deleting pod %v/%v: %v", p.Namespace, p.Name, err)
|
||
|
}
|
||
|
}
|
||
|
for _, p := range pods {
|
||
|
if err := wait.Poll(time.Second, wait.ForeverTestTimeout, podDeleted(cs, p.Namespace, p.Name)); err != nil {
|
||
|
t.Errorf("error while waiting for pod %v/%v to get deleted: %v", p.Namespace, p.Name, err)
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
|
||
|
// printAllPods prints a list of all the pods and their node names. This is used
|
||
|
// for debugging.
|
||
|
func printAllPods(t *testing.T, cs clientset.Interface, nsName string) {
|
||
|
podList, err := cs.CoreV1().Pods(nsName).List(metav1.ListOptions{})
|
||
|
if err != nil {
|
||
|
t.Logf("Error getting pods: %v", err)
|
||
|
}
|
||
|
for _, pod := range podList.Items {
|
||
|
t.Logf("Pod:\n\tName:%v\n\tNamespace:%v\n\tNode Name:%v\n", pod.Name, pod.Namespace, pod.Spec.NodeName)
|
||
|
}
|
||
|
}
|