
Automatic merge from submit-queue. If you want to cherry-pick this change to another branch, please follow the instructions <a href="https://github.com/kubernetes/community/blob/master/contributors/devel/cherry-picks.md">here</a>.

openstack: remove orphaned routes from terminated instances

**What this PR does / why we need it**: At the moment the openstack cloudprovider only returns routes whose `NextHop` address points to an existing openstack instance. This is a problem when an instance is terminated before the corresponding node is removed from k8s: the existing route is no longer returned by the cloudprovider and is therefore never considered for deletion by the route controller. When the route's `DestinationCIDR` is reassigned to a new node, the router ends up with two routes for that CIDR pointing to different `NextHop` addresses, which leads to broken networking. This PR stops skipping routes that point to unknown next hops when listing routes. This should cause [this conditional](93dc3763b0/pkg/controller/route/route_controller.go#L208) in the route controller to succeed and have the route removed if the route controller [feels responsible](93dc3763b0/pkg/controller/route/route_controller.go#L206).

```release-note
OpenStack cloudprovider: Ensure orphaned routes are removed.
```
320 lines
7.7 KiB
Go
320 lines
7.7 KiB
Go
/*
|
|
Copyright 2016 The Kubernetes Authors.
|
|
|
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
you may not use this file except in compliance with the License.
|
|
You may obtain a copy of the License at
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
See the License for the specific language governing permissions and
|
|
limitations under the License.
|
|
*/
|
|
|
|
package openstack
|
|
|
|
import (
|
|
"errors"
|
|
|
|
"github.com/gophercloud/gophercloud"
|
|
"github.com/gophercloud/gophercloud/openstack/compute/v2/servers"
|
|
"github.com/gophercloud/gophercloud/openstack/networking/v2/extensions/layer3/routers"
|
|
neutronports "github.com/gophercloud/gophercloud/openstack/networking/v2/ports"
|
|
|
|
"github.com/golang/glog"
|
|
"k8s.io/apimachinery/pkg/types"
|
|
"k8s.io/kubernetes/pkg/cloudprovider"
|
|
)
|
|
|
|
// ErrNoRouterId is returned by NewRoutes when the supplied RouterOpts has an
// empty RouterId.
var ErrNoRouterId = errors.New("router-id not set in cloud provider config")
|
|
|
|
type Routes struct {
|
|
compute *gophercloud.ServiceClient
|
|
network *gophercloud.ServiceClient
|
|
opts RouterOpts
|
|
}
|
|
|
|
func NewRoutes(compute *gophercloud.ServiceClient, network *gophercloud.ServiceClient, opts RouterOpts) (cloudprovider.Routes, error) {
|
|
if opts.RouterId == "" {
|
|
return nil, ErrNoRouterId
|
|
}
|
|
|
|
return &Routes{
|
|
compute: compute,
|
|
network: network,
|
|
opts: opts,
|
|
}, nil
|
|
}
|
|
|
|
func (r *Routes) ListRoutes(clusterName string) ([]*cloudprovider.Route, error) {
|
|
glog.V(4).Infof("ListRoutes(%v)", clusterName)
|
|
|
|
nodeNamesByAddr := make(map[string]types.NodeName)
|
|
err := foreachServer(r.compute, servers.ListOpts{}, func(srv *servers.Server) (bool, error) {
|
|
addrs, err := nodeAddresses(srv)
|
|
if err != nil {
|
|
return false, err
|
|
}
|
|
|
|
name := mapServerToNodeName(srv)
|
|
for _, addr := range addrs {
|
|
nodeNamesByAddr[addr.Address] = name
|
|
}
|
|
|
|
return true, nil
|
|
})
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
router, err := routers.Get(r.network, r.opts.RouterId).Extract()
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
var routes []*cloudprovider.Route
|
|
for _, item := range router.Routes {
|
|
nodeName, foundNode := nodeNamesByAddr[item.NextHop]
|
|
route := cloudprovider.Route{
|
|
Name: item.DestinationCIDR,
|
|
TargetNode: nodeName, //empty if NextHop is unknown
|
|
Blackhole: !foundNode,
|
|
DestinationCIDR: item.DestinationCIDR,
|
|
}
|
|
routes = append(routes, &route)
|
|
}
|
|
|
|
return routes, nil
|
|
}
|
|
|
|
func updateRoutes(network *gophercloud.ServiceClient, router *routers.Router, newRoutes []routers.Route) (func(), error) {
|
|
origRoutes := router.Routes // shallow copy
|
|
|
|
_, err := routers.Update(network, router.ID, routers.UpdateOpts{
|
|
Routes: newRoutes,
|
|
}).Extract()
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
unwinder := func() {
|
|
glog.V(4).Info("Reverting routes change to router ", router.ID)
|
|
_, err := routers.Update(network, router.ID, routers.UpdateOpts{
|
|
Routes: origRoutes,
|
|
}).Extract()
|
|
if err != nil {
|
|
glog.Warning("Unable to reset routes during error unwind: ", err)
|
|
}
|
|
}
|
|
|
|
return unwinder, nil
|
|
}
|
|
|
|
func updateAllowedAddressPairs(network *gophercloud.ServiceClient, port *neutronports.Port, newPairs []neutronports.AddressPair) (func(), error) {
|
|
origPairs := port.AllowedAddressPairs // shallow copy
|
|
|
|
_, err := neutronports.Update(network, port.ID, neutronports.UpdateOpts{
|
|
AllowedAddressPairs: &newPairs,
|
|
}).Extract()
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
unwinder := func() {
|
|
glog.V(4).Info("Reverting allowed-address-pairs change to port ", port.ID)
|
|
_, err := neutronports.Update(network, port.ID, neutronports.UpdateOpts{
|
|
AllowedAddressPairs: &origPairs,
|
|
}).Extract()
|
|
if err != nil {
|
|
glog.Warning("Unable to reset allowed-address-pairs during error unwind: ", err)
|
|
}
|
|
}
|
|
|
|
return unwinder, nil
|
|
}
|
|
|
|
func (r *Routes) CreateRoute(clusterName string, nameHint string, route *cloudprovider.Route) error {
|
|
glog.V(4).Infof("CreateRoute(%v, %v, %v)", clusterName, nameHint, route)
|
|
|
|
onFailure := NewCaller()
|
|
|
|
addr, err := getAddressByName(r.compute, route.TargetNode)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
glog.V(4).Infof("Using nexthop %v for node %v", addr, route.TargetNode)
|
|
|
|
router, err := routers.Get(r.network, r.opts.RouterId).Extract()
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
routes := router.Routes
|
|
|
|
for _, item := range routes {
|
|
if item.DestinationCIDR == route.DestinationCIDR && item.NextHop == addr {
|
|
glog.V(4).Infof("Skipping existing route: %v", route)
|
|
return nil
|
|
}
|
|
}
|
|
|
|
routes = append(routes, routers.Route{
|
|
DestinationCIDR: route.DestinationCIDR,
|
|
NextHop: addr,
|
|
})
|
|
|
|
unwind, err := updateRoutes(r.network, router, routes)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
defer onFailure.Call(unwind)
|
|
|
|
// get the port of addr on target node.
|
|
portID, err := getPortIDByIP(r.compute, route.TargetNode, addr)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
port, err := getPortByID(r.network, portID)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
found := false
|
|
for _, item := range port.AllowedAddressPairs {
|
|
if item.IPAddress == route.DestinationCIDR {
|
|
glog.V(4).Info("Found existing allowed-address-pair: ", item)
|
|
found = true
|
|
break
|
|
}
|
|
}
|
|
|
|
if !found {
|
|
newPairs := append(port.AllowedAddressPairs, neutronports.AddressPair{
|
|
IPAddress: route.DestinationCIDR,
|
|
})
|
|
unwind, err := updateAllowedAddressPairs(r.network, port, newPairs)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
defer onFailure.Call(unwind)
|
|
}
|
|
|
|
glog.V(4).Infof("Route created: %v", route)
|
|
onFailure.Disarm()
|
|
return nil
|
|
}
|
|
|
|
func (r *Routes) DeleteRoute(clusterName string, route *cloudprovider.Route) error {
|
|
glog.V(4).Infof("DeleteRoute(%v, %v)", clusterName, route)
|
|
|
|
onFailure := NewCaller()
|
|
|
|
addr, err := getAddressByName(r.compute, route.TargetNode)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
router, err := routers.Get(r.network, r.opts.RouterId).Extract()
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
routes := router.Routes
|
|
index := -1
|
|
for i, item := range routes {
|
|
if item.DestinationCIDR == route.DestinationCIDR && item.NextHop == addr {
|
|
index = i
|
|
break
|
|
}
|
|
}
|
|
|
|
if index == -1 {
|
|
glog.V(4).Infof("Skipping non-existent route: %v", route)
|
|
return nil
|
|
}
|
|
|
|
// Delete element `index`
|
|
routes[index] = routes[len(routes)-1]
|
|
routes = routes[:len(routes)-1]
|
|
|
|
unwind, err := updateRoutes(r.network, router, routes)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
defer onFailure.Call(unwind)
|
|
|
|
// get the port of addr on target node.
|
|
portID, err := getPortIDByIP(r.compute, route.TargetNode, addr)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
port, err := getPortByID(r.network, portID)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
addr_pairs := port.AllowedAddressPairs
|
|
index = -1
|
|
for i, item := range addr_pairs {
|
|
if item.IPAddress == route.DestinationCIDR {
|
|
index = i
|
|
break
|
|
}
|
|
}
|
|
|
|
if index != -1 {
|
|
// Delete element `index`
|
|
addr_pairs[index] = addr_pairs[len(addr_pairs)-1]
|
|
addr_pairs = addr_pairs[:len(addr_pairs)-1]
|
|
|
|
unwind, err := updateAllowedAddressPairs(r.network, port, addr_pairs)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
defer onFailure.Call(unwind)
|
|
}
|
|
|
|
glog.V(4).Infof("Route deleted: %v", route)
|
|
onFailure.Disarm()
|
|
return nil
|
|
}
|
|
|
|
func getPortIDByIP(compute *gophercloud.ServiceClient, targetNode types.NodeName, ipAddress string) (string, error) {
|
|
srv, err := getServerByName(compute, targetNode, true)
|
|
if err != nil {
|
|
return "", err
|
|
}
|
|
|
|
interfaces, err := getAttachedInterfacesByID(compute, srv.ID)
|
|
if err != nil {
|
|
return "", err
|
|
}
|
|
|
|
for _, intf := range interfaces {
|
|
for _, fixedIP := range intf.FixedIPs {
|
|
if fixedIP.IPAddress == ipAddress {
|
|
return intf.PortID, nil
|
|
}
|
|
}
|
|
}
|
|
|
|
return "", ErrNotFound
|
|
}
|
|
|
|
func getPortByID(client *gophercloud.ServiceClient, portID string) (*neutronports.Port, error) {
|
|
targetPort, err := neutronports.Get(client, portID).Extract()
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
if targetPort == nil {
|
|
return nil, ErrNotFound
|
|
}
|
|
|
|
return targetPort, nil
|
|
}
|