
MultiCIDRRangeAllocator is a new Range Allocator which makes using multiple ClusterCIDRs possible. It consists of two controllers, one for reconciling the ClusterCIDR API objects and the other for allocating Pod CIDRs to the nodes. The allocation is based on the rules defined in https://github.com/kubernetes/enhancements/tree/master/keps/sig-network/2593-multiple-cluster-cidrs
174 lines
5.9 KiB
Go
174 lines
5.9 KiB
Go
/*
|
|
Copyright 2014 The Kubernetes Authors.
|
|
|
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
you may not use this file except in compliance with the License.
|
|
You may obtain a copy of the License at
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
See the License for the specific language governing permissions and
|
|
limitations under the License.
|
|
*/
|
|
|
|
package nodeipam
|
|
|
|
import (
|
|
"net"
|
|
"time"
|
|
|
|
utilruntime "k8s.io/apimachinery/pkg/util/runtime"
|
|
coreinformers "k8s.io/client-go/informers/core/v1"
|
|
networkinginformers "k8s.io/client-go/informers/networking/v1alpha1"
|
|
clientset "k8s.io/client-go/kubernetes"
|
|
v1core "k8s.io/client-go/kubernetes/typed/core/v1"
|
|
corelisters "k8s.io/client-go/listers/core/v1"
|
|
"k8s.io/client-go/tools/cache"
|
|
"k8s.io/client-go/tools/record"
|
|
cloudprovider "k8s.io/cloud-provider"
|
|
controllersmetrics "k8s.io/component-base/metrics/prometheus/controllers"
|
|
"k8s.io/component-base/metrics/prometheus/ratelimiter"
|
|
"k8s.io/klog/v2"
|
|
"k8s.io/kubernetes/pkg/controller/nodeipam/ipam"
|
|
)
|
|
|
|
const (
|
|
// ipamResyncInterval is the amount of time between when the cloud and node
|
|
// CIDR range assignments are synchronized.
|
|
ipamResyncInterval = 30 * time.Second
|
|
// ipamMaxBackoff is the maximum backoff for retrying synchronization of a
|
|
// given in the error state.
|
|
ipamMaxBackoff = 10 * time.Second
|
|
// ipamInitialRetry is the initial retry interval for retrying synchronization of a
|
|
// given in the error state.
|
|
ipamInitialBackoff = 250 * time.Millisecond
|
|
)
|
|
|
|
// Controller is the controller that manages node ipam state.
|
|
type Controller struct {
|
|
allocatorType ipam.CIDRAllocatorType
|
|
|
|
cloud cloudprovider.Interface
|
|
clusterCIDRs []*net.IPNet
|
|
serviceCIDR *net.IPNet
|
|
secondaryServiceCIDR *net.IPNet
|
|
kubeClient clientset.Interface
|
|
// Method for easy mocking in unittest.
|
|
lookupIP func(host string) ([]net.IP, error)
|
|
|
|
nodeLister corelisters.NodeLister
|
|
nodeInformerSynced cache.InformerSynced
|
|
|
|
cidrAllocator ipam.CIDRAllocator
|
|
}
|
|
|
|
// NewNodeIpamController returns a new node IP Address Management controller to
|
|
// sync instances from cloudprovider.
|
|
// This method returns an error if it is unable to initialize the CIDR bitmap with
|
|
// podCIDRs it has already allocated to nodes. Since we don't allow podCIDR changes
|
|
// currently, this should be handled as a fatal error.
|
|
func NewNodeIpamController(
|
|
nodeInformer coreinformers.NodeInformer,
|
|
clusterCIDRInformer networkinginformers.ClusterCIDRInformer,
|
|
cloud cloudprovider.Interface,
|
|
kubeClient clientset.Interface,
|
|
clusterCIDRs []*net.IPNet,
|
|
serviceCIDR *net.IPNet,
|
|
secondaryServiceCIDR *net.IPNet,
|
|
nodeCIDRMaskSizes []int,
|
|
allocatorType ipam.CIDRAllocatorType) (*Controller, error) {
|
|
|
|
if kubeClient == nil {
|
|
klog.Fatalf("kubeClient is nil when starting Controller")
|
|
}
|
|
|
|
eventBroadcaster := record.NewBroadcaster()
|
|
eventBroadcaster.StartStructuredLogging(0)
|
|
|
|
klog.Infof("Sending events to api server.")
|
|
eventBroadcaster.StartRecordingToSink(
|
|
&v1core.EventSinkImpl{
|
|
Interface: kubeClient.CoreV1().Events(""),
|
|
})
|
|
|
|
if kubeClient.CoreV1().RESTClient().GetRateLimiter() != nil {
|
|
ratelimiter.RegisterMetricAndTrackRateLimiterUsage("node_ipam_controller", kubeClient.CoreV1().RESTClient().GetRateLimiter())
|
|
}
|
|
|
|
// Cloud CIDR allocator does not rely on clusterCIDR or nodeCIDRMaskSize for allocation.
|
|
if allocatorType != ipam.CloudAllocatorType {
|
|
if len(clusterCIDRs) == 0 {
|
|
klog.Fatal("Controller: Must specify --cluster-cidr if --allocate-node-cidrs is set")
|
|
}
|
|
|
|
for idx, cidr := range clusterCIDRs {
|
|
mask := cidr.Mask
|
|
if maskSize, _ := mask.Size(); maskSize > nodeCIDRMaskSizes[idx] {
|
|
klog.Fatal("Controller: Invalid --cluster-cidr, mask size of cluster CIDR must be less than or equal to --node-cidr-mask-size configured for CIDR family")
|
|
}
|
|
}
|
|
}
|
|
|
|
ic := &Controller{
|
|
cloud: cloud,
|
|
kubeClient: kubeClient,
|
|
lookupIP: net.LookupIP,
|
|
clusterCIDRs: clusterCIDRs,
|
|
serviceCIDR: serviceCIDR,
|
|
secondaryServiceCIDR: secondaryServiceCIDR,
|
|
allocatorType: allocatorType,
|
|
}
|
|
|
|
// TODO: Abstract this check into a generic controller manager should run method.
|
|
if ic.allocatorType == ipam.IPAMFromClusterAllocatorType || ic.allocatorType == ipam.IPAMFromCloudAllocatorType {
|
|
startLegacyIPAM(ic, nodeInformer, cloud, kubeClient, clusterCIDRs, serviceCIDR, nodeCIDRMaskSizes)
|
|
} else {
|
|
var err error
|
|
|
|
allocatorParams := ipam.CIDRAllocatorParams{
|
|
ClusterCIDRs: clusterCIDRs,
|
|
ServiceCIDR: ic.serviceCIDR,
|
|
SecondaryServiceCIDR: ic.secondaryServiceCIDR,
|
|
NodeCIDRMaskSizes: nodeCIDRMaskSizes,
|
|
}
|
|
|
|
ic.cidrAllocator, err = ipam.New(kubeClient, cloud, nodeInformer, clusterCIDRInformer, ic.allocatorType, allocatorParams)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
}
|
|
|
|
ic.nodeLister = nodeInformer.Lister()
|
|
ic.nodeInformerSynced = nodeInformer.Informer().HasSynced
|
|
|
|
return ic, nil
|
|
}
|
|
|
|
// Run starts an asynchronous loop that monitors the status of cluster nodes.
|
|
func (nc *Controller) Run(stopCh <-chan struct{}) {
|
|
defer utilruntime.HandleCrash()
|
|
|
|
klog.Infof("Starting ipam controller")
|
|
defer klog.Infof("Shutting down ipam controller")
|
|
|
|
if !cache.WaitForNamedCacheSync("node", stopCh, nc.nodeInformerSynced) {
|
|
return
|
|
}
|
|
|
|
if nc.allocatorType != ipam.IPAMFromClusterAllocatorType && nc.allocatorType != ipam.IPAMFromCloudAllocatorType {
|
|
go nc.cidrAllocator.Run(stopCh)
|
|
}
|
|
|
|
<-stopCh
|
|
}
|
|
|
|
// RunWithMetrics is a wrapper for Run that also tracks starting and stopping of the nodeipam controller with additional metric
|
|
func (nc *Controller) RunWithMetrics(stopCh <-chan struct{}, controllerManagerMetrics *controllersmetrics.ControllerManagerMetrics) {
|
|
controllerManagerMetrics.ControllerStarted("nodeipam")
|
|
defer controllerManagerMetrics.ControllerStopped("nodeipam")
|
|
nc.Run(stopCh)
|
|
}
|