
For AWS EBS, a volume can only be attached to a node in the same AZ. The scheduler must therefore detect whether a volume is being attached to a pod, and ensure that the pod is scheduled on a node in the same AZ as the volume. So that the scheduler need not query the cloud provider every time, and to support decoupled operation (e.g. bare metal), we tag the volume with our placement labels. On AWS this is done automatically by an admission controller when a PersistentVolume backed by an EBS volume is created. Support for tagging GCE PVs will follow. Pods that specify a volume directly (i.e. without using a PersistentVolumeClaim) will not currently be scheduled correctly (i.e. they will be scheduled without zone-awareness).
104 lines
4.3 KiB
Go
104 lines
4.3 KiB
Go
/*
|
|
Copyright 2014 The Kubernetes Authors All rights reserved.
|
|
|
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
you may not use this file except in compliance with the License.
|
|
You may obtain a copy of the License at
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
See the License for the specific language governing permissions and
|
|
limitations under the License.
|
|
*/
|
|
|
|
// This is the default algorithm provider for the scheduler.
|
|
package defaults
|
|
|
|
import (
|
|
"k8s.io/kubernetes/pkg/util/sets"
|
|
"k8s.io/kubernetes/plugin/pkg/scheduler"
|
|
"k8s.io/kubernetes/plugin/pkg/scheduler/algorithm"
|
|
"k8s.io/kubernetes/plugin/pkg/scheduler/algorithm/predicates"
|
|
"k8s.io/kubernetes/plugin/pkg/scheduler/algorithm/priorities"
|
|
"k8s.io/kubernetes/plugin/pkg/scheduler/factory"
|
|
)
|
|
|
|
func init() {
|
|
factory.RegisterAlgorithmProvider(factory.DefaultProvider, defaultPredicates(), defaultPriorities())
|
|
// EqualPriority is a prioritizer function that gives an equal weight of one to all nodes
|
|
// Register the priority function so that its available
|
|
// but do not include it as part of the default priorities
|
|
factory.RegisterPriorityFunction("EqualPriority", scheduler.EqualPriority, 1)
|
|
|
|
// ServiceSpreadingPriority is a priority config factory that spreads pods by minimizing
|
|
// the number of pods (belonging to the same service) on the same node.
|
|
// Register the factory so that it's available, but do not include it as part of the default priorities
|
|
// Largely replaced by "SelectorSpreadPriority", but registered for backward compatibility with 1.0
|
|
factory.RegisterPriorityConfigFactory(
|
|
"ServiceSpreadingPriority",
|
|
factory.PriorityConfigFactory{
|
|
Function: func(args factory.PluginFactoryArgs) algorithm.PriorityFunction {
|
|
return priorities.NewSelectorSpreadPriority(args.ServiceLister, algorithm.EmptyControllerLister{})
|
|
},
|
|
Weight: 1,
|
|
},
|
|
)
|
|
// PodFitsPorts has been replaced by PodFitsHostPorts for better user understanding.
|
|
// For backwards compatibility with 1.0, PodFitsPorts is regitered as well.
|
|
factory.RegisterFitPredicate("PodFitsPorts", predicates.PodFitsHostPorts)
|
|
}
|
|
|
|
func defaultPredicates() sets.String {
|
|
return sets.NewString(
|
|
// Fit is defined based on the absence of port conflicts.
|
|
factory.RegisterFitPredicate("PodFitsHostPorts", predicates.PodFitsHostPorts),
|
|
// Fit is determined by resource availability.
|
|
factory.RegisterFitPredicateFactory(
|
|
"PodFitsResources",
|
|
func(args factory.PluginFactoryArgs) algorithm.FitPredicate {
|
|
return predicates.NewResourceFitPredicate(args.NodeInfo)
|
|
},
|
|
),
|
|
// Fit is determined by non-conflicting disk volumes.
|
|
factory.RegisterFitPredicate("NoDiskConflict", predicates.NoDiskConflict),
|
|
// Fit is determined by volume zone requirements.
|
|
factory.RegisterFitPredicateFactory(
|
|
"NoVolumeZoneConflict",
|
|
func(args factory.PluginFactoryArgs) algorithm.FitPredicate {
|
|
return predicates.NewVolumeZonePredicate(args.NodeInfo, args.PVInfo, args.PVCInfo)
|
|
},
|
|
),
|
|
// Fit is determined by node selector query.
|
|
factory.RegisterFitPredicateFactory(
|
|
"MatchNodeSelector",
|
|
func(args factory.PluginFactoryArgs) algorithm.FitPredicate {
|
|
return predicates.NewSelectorMatchPredicate(args.NodeInfo)
|
|
},
|
|
),
|
|
// Fit is determined by the presence of the Host parameter and a string match
|
|
factory.RegisterFitPredicate("HostName", predicates.PodFitsHost),
|
|
)
|
|
}
|
|
|
|
func defaultPriorities() sets.String {
|
|
return sets.NewString(
|
|
// Prioritize nodes by least requested utilization.
|
|
factory.RegisterPriorityFunction("LeastRequestedPriority", priorities.LeastRequestedPriority, 1),
|
|
// Prioritizes nodes to help achieve balanced resource usage
|
|
factory.RegisterPriorityFunction("BalancedResourceAllocation", priorities.BalancedResourceAllocation, 1),
|
|
// spreads pods by minimizing the number of pods (belonging to the same service or replication controller) on the same node.
|
|
factory.RegisterPriorityConfigFactory(
|
|
"SelectorSpreadPriority",
|
|
factory.PriorityConfigFactory{
|
|
Function: func(args factory.PluginFactoryArgs) algorithm.PriorityFunction {
|
|
return priorities.NewSelectorSpreadPriority(args.ServiceLister, args.ControllerLister)
|
|
},
|
|
Weight: 1,
|
|
},
|
|
),
|
|
)
|
|
}
|