
DONE: 1. refactor all predicates: predicates return fitOrNot(bool) and error(Error) in which the latter is of type PredicateFailureError or InsufficientResourceError. (For violation of either MaxEBSVolumeCount or MaxGCEPDVolumeCount, returns one same error type as ErrMaxVolumeCountExceeded) 2. GeneralPredicates() is a predicate function, which includes serveral other predicate functions (PodFitsResource, PodFitsHost, PodFitsHostPort). It is registered as one of the predicates in DefaultAlgorithmProvider, and is also called in canAdmitPod() in Kubelet and should be called by other components (like rescheduler, etc) if necessary. See discussion in issue #12744 3. remove podNumber check from GeneralPredicates 4. HostName is now verified in Kubelet's canAdminPod(). add TestHostNameConflicts in kubelet_test.go 5. add getNodeAnyWay() method in Kubelet to get node information in standaloneMode TODO: 1. determine which predicates should be included in GeneralPredicates() 2. separate GeneralPredicates() into: a. GeneralPredicatesEvictPod() and b. GeneralPredicatesNotEvictPod() 3. DaemonSet should use GeneralPredicates()
173 lines
7.4 KiB
Go
173 lines
7.4 KiB
Go
/*
|
|
Copyright 2014 The Kubernetes Authors All rights reserved.
|
|
|
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
you may not use this file except in compliance with the License.
|
|
You may obtain a copy of the License at
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
See the License for the specific language governing permissions and
|
|
limitations under the License.
|
|
*/
|
|
|
|
// This is the default algorithm provider for the scheduler.
|
|
package defaults
|
|
|
|
import (
|
|
"os"
|
|
"strconv"
|
|
|
|
"k8s.io/kubernetes/pkg/cloudprovider/providers/aws"
|
|
"k8s.io/kubernetes/pkg/util/sets"
|
|
"k8s.io/kubernetes/plugin/pkg/scheduler"
|
|
"k8s.io/kubernetes/plugin/pkg/scheduler/algorithm"
|
|
"k8s.io/kubernetes/plugin/pkg/scheduler/algorithm/predicates"
|
|
"k8s.io/kubernetes/plugin/pkg/scheduler/algorithm/priorities"
|
|
"k8s.io/kubernetes/plugin/pkg/scheduler/factory"
|
|
|
|
"github.com/golang/glog"
|
|
)
|
|
|
|
// GCE instances can have up to 16 PD volumes attached.
|
|
const DefaultMaxGCEPDVolumes = 16
|
|
|
|
// getMaxVols checks the max PD volumes environment variable, otherwise returning a default value
|
|
func getMaxVols(defaultVal int) int {
|
|
if rawMaxVols := os.Getenv("KUBE_MAX_PD_VOLS"); rawMaxVols != "" {
|
|
if parsedMaxVols, err := strconv.Atoi(rawMaxVols); err != nil {
|
|
glog.Errorf("Unable to parse maxiumum PD volumes value, using default of %v: %v", defaultVal, err)
|
|
} else if parsedMaxVols <= 0 {
|
|
glog.Errorf("Maximum PD volumes must be a positive value, using default of %v", defaultVal)
|
|
} else {
|
|
return parsedMaxVols
|
|
}
|
|
}
|
|
|
|
return defaultVal
|
|
}
|
|
|
|
func init() {
|
|
factory.RegisterAlgorithmProvider(factory.DefaultProvider, defaultPredicates(), defaultPriorities())
|
|
// EqualPriority is a prioritizer function that gives an equal weight of one to all nodes
|
|
// Register the priority function so that its available
|
|
// but do not include it as part of the default priorities
|
|
factory.RegisterPriorityFunction("EqualPriority", scheduler.EqualPriority, 1)
|
|
|
|
// ServiceSpreadingPriority is a priority config factory that spreads pods by minimizing
|
|
// the number of pods (belonging to the same service) on the same node.
|
|
// Register the factory so that it's available, but do not include it as part of the default priorities
|
|
// Largely replaced by "SelectorSpreadPriority", but registered for backward compatibility with 1.0
|
|
factory.RegisterPriorityConfigFactory(
|
|
"ServiceSpreadingPriority",
|
|
factory.PriorityConfigFactory{
|
|
Function: func(args factory.PluginFactoryArgs) algorithm.PriorityFunction {
|
|
return priorities.NewSelectorSpreadPriority(args.PodLister, args.ServiceLister, algorithm.EmptyControllerLister{}, algorithm.EmptyReplicaSetLister{})
|
|
},
|
|
Weight: 1,
|
|
},
|
|
)
|
|
// PodFitsPorts has been replaced by PodFitsHostPorts for better user understanding.
|
|
// For backwards compatibility with 1.0, PodFitsPorts is regitered as well.
|
|
factory.RegisterFitPredicate("PodFitsPorts", predicates.PodFitsHostPorts)
|
|
// ImageLocalityPriority prioritizes nodes based on locality of images requested by a pod. Nodes with larger size
|
|
// of already-installed packages required by the pod will be preferred over nodes with no already-installed
|
|
// packages required by the pod or a small total size of already-installed packages required by the pod.
|
|
factory.RegisterPriorityFunction("ImageLocalityPriority", priorities.ImageLocalityPriority, 1)
|
|
// Fit is defined based on the absence of port conflicts.
|
|
// This predicate is actually a default predicate, because it is invoked from
|
|
// predicates.GeneralPredicates()
|
|
factory.RegisterFitPredicate("PodFitsHostPorts", predicates.PodFitsHostPorts)
|
|
// Fit is determined by resource availability.
|
|
// This predicate is actually a default predicate, because it is invoked from
|
|
// predicates.GeneralPredicates()
|
|
factory.RegisterFitPredicateFactory(
|
|
"PodFitsResources",
|
|
func(args factory.PluginFactoryArgs) algorithm.FitPredicate {
|
|
return predicates.NewResourceFitPredicate(args.NodeInfo)
|
|
},
|
|
)
|
|
// Fit is determined by the presence of the Host parameter and a string match
|
|
// This predicate is actually a default predicate, because it is invoked from
|
|
// predicates.GeneralPredicates()
|
|
factory.RegisterFitPredicate("HostName", predicates.PodFitsHost)
|
|
}
|
|
|
|
func defaultPredicates() sets.String {
|
|
return sets.NewString(
|
|
// Fit is determined by non-conflicting disk volumes.
|
|
factory.RegisterFitPredicate("NoDiskConflict", predicates.NoDiskConflict),
|
|
// Fit is determined by volume zone requirements.
|
|
factory.RegisterFitPredicateFactory(
|
|
"NoVolumeZoneConflict",
|
|
func(args factory.PluginFactoryArgs) algorithm.FitPredicate {
|
|
return predicates.NewVolumeZonePredicate(args.NodeInfo, args.PVInfo, args.PVCInfo)
|
|
},
|
|
),
|
|
// Fit is determined by node selector query.
|
|
factory.RegisterFitPredicateFactory(
|
|
"MatchNodeSelector",
|
|
func(args factory.PluginFactoryArgs) algorithm.FitPredicate {
|
|
return predicates.NewSelectorMatchPredicate(args.NodeInfo)
|
|
},
|
|
),
|
|
// Fit is determined by whether or not there would be too many AWS EBS volumes attached to the node
|
|
factory.RegisterFitPredicateFactory(
|
|
"MaxEBSVolumeCount",
|
|
func(args factory.PluginFactoryArgs) algorithm.FitPredicate {
|
|
// TODO: allow for generically parameterized scheduler predicates, because this is a bit ugly
|
|
maxVols := getMaxVols(aws.DefaultMaxEBSVolumes)
|
|
return predicates.NewMaxPDVolumeCountPredicate(predicates.EBSVolumeFilter, maxVols, args.PVInfo, args.PVCInfo)
|
|
},
|
|
),
|
|
// Fit is determined by whether or not there would be too many GCE PD volumes attached to the node
|
|
factory.RegisterFitPredicateFactory(
|
|
"MaxGCEPDVolumeCount",
|
|
func(args factory.PluginFactoryArgs) algorithm.FitPredicate {
|
|
// TODO: allow for generically parameterized scheduler predicates, because this is a bit ugly
|
|
maxVols := getMaxVols(DefaultMaxGCEPDVolumes)
|
|
return predicates.NewMaxPDVolumeCountPredicate(predicates.GCEPDVolumeFilter, maxVols, args.PVInfo, args.PVCInfo)
|
|
},
|
|
),
|
|
// GeneralPredicates are the predicates that are enforced by all Kubernetes components
|
|
// (e.g. kubelet and all schedulers)
|
|
factory.RegisterFitPredicateFactory(
|
|
"GeneralPredicates",
|
|
func(args factory.PluginFactoryArgs) algorithm.FitPredicate {
|
|
return predicates.GeneralPredicates(args.NodeInfo)
|
|
},
|
|
),
|
|
)
|
|
}
|
|
|
|
func defaultPriorities() sets.String {
|
|
return sets.NewString(
|
|
// Prioritize nodes by least requested utilization.
|
|
factory.RegisterPriorityFunction("LeastRequestedPriority", priorities.LeastRequestedPriority, 1),
|
|
// Prioritizes nodes to help achieve balanced resource usage
|
|
factory.RegisterPriorityFunction("BalancedResourceAllocation", priorities.BalancedResourceAllocation, 1),
|
|
// spreads pods by minimizing the number of pods (belonging to the same service or replication controller) on the same node.
|
|
factory.RegisterPriorityConfigFactory(
|
|
"SelectorSpreadPriority",
|
|
factory.PriorityConfigFactory{
|
|
Function: func(args factory.PluginFactoryArgs) algorithm.PriorityFunction {
|
|
return priorities.NewSelectorSpreadPriority(args.PodLister, args.ServiceLister, args.ControllerLister, args.ReplicaSetLister)
|
|
},
|
|
Weight: 1,
|
|
},
|
|
),
|
|
factory.RegisterPriorityConfigFactory(
|
|
"NodeAffinityPriority",
|
|
factory.PriorityConfigFactory{
|
|
Function: func(args factory.PluginFactoryArgs) algorithm.PriorityFunction {
|
|
return priorities.NewNodeAffinityPriority(args.NodeLister)
|
|
},
|
|
Weight: 1,
|
|
},
|
|
),
|
|
)
|
|
}
|