
Like the current device plugin interface, a DRA driver using this model announces a list of resource instances. In contrast to device plugins, this list is made available to the scheduler together with attributes that can be used to select suitable instances when they are not all alike. Because this is the first structured parameter model, some checks that previously were not possible, in particular "is one structured parameter field set", now get enabled. Adding another structured parameter model will be similar. The applyconfigs code generator assumes that all types in an API are defined in a single package. If it weren't for that, it would be possible to place the "named resources" types in separate packages, which would make their names in the Go code more natural and would provide an indication of their stability level because the package name could include a version.
236 lines
8.3 KiB
Go
236 lines
8.3 KiB
Go
/*
|
|
Copyright 2024 The Kubernetes Authors.
|
|
|
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
you may not use this file except in compliance with the License.
|
|
You may obtain a copy of the License at
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
See the License for the specific language governing permissions and
|
|
limitations under the License.
|
|
*/
|
|
|
|
package dynamicresources
|
|
|
|
import (
|
|
"context"
|
|
"fmt"
|
|
|
|
v1 "k8s.io/api/core/v1"
|
|
resourcev1alpha2 "k8s.io/api/resource/v1alpha2"
|
|
"k8s.io/apimachinery/pkg/labels"
|
|
"k8s.io/apimachinery/pkg/runtime"
|
|
resourcev1alpha2listers "k8s.io/client-go/listers/resource/v1alpha2"
|
|
"k8s.io/klog/v2"
|
|
namedresourcesmodel "k8s.io/kubernetes/pkg/scheduler/framework/plugins/dynamicresources/structured/namedresources"
|
|
"k8s.io/kubernetes/pkg/scheduler/framework/plugins/volumebinding"
|
|
)
|
|
|
|
// resources is a map "node name" -> "driver name" -> available and
|
|
// allocated resources per structured parameter model.
|
|
type resources map[string]map[string]resourceModels
|
|
|
|
// resourceModels may have more than one entry because it is valid for a driver to
|
|
// use more than one structured parameter model.
|
|
type resourceModels struct {
|
|
namedresources namedresourcesmodel.Model
|
|
}
|
|
|
|
// newResourceModel parses the available information about resources. Objects
|
|
// with an unknown structured parameter model silently ignored. An error gets
|
|
// logged later when parameters required for a pod depend on such an unknown
|
|
// model.
|
|
func newResourceModel(logger klog.Logger, nodeResourceSliceLister resourcev1alpha2listers.NodeResourceSliceLister, claimAssumeCache volumebinding.AssumeCache) (resources, error) {
|
|
model := make(resources)
|
|
|
|
slices, err := nodeResourceSliceLister.List(labels.Everything())
|
|
if err != nil {
|
|
return nil, fmt.Errorf("list node resource slices: %w", err)
|
|
}
|
|
for _, slice := range slices {
|
|
if model[slice.NodeName] == nil {
|
|
model[slice.NodeName] = make(map[string]resourceModels)
|
|
}
|
|
resource := model[slice.NodeName][slice.DriverName]
|
|
namedresourcesmodel.AddResources(&resource.namedresources, slice.NamedResources)
|
|
model[slice.NodeName][slice.DriverName] = resource
|
|
}
|
|
|
|
objs := claimAssumeCache.List(nil)
|
|
for _, obj := range objs {
|
|
claim, ok := obj.(*resourcev1alpha2.ResourceClaim)
|
|
if !ok {
|
|
return nil, fmt.Errorf("got unexpected object of type %T from claim assume cache", obj)
|
|
}
|
|
if claim.Status.Allocation == nil {
|
|
continue
|
|
}
|
|
for _, handle := range claim.Status.Allocation.ResourceHandles {
|
|
structured := handle.StructuredData
|
|
if structured == nil {
|
|
continue
|
|
}
|
|
if model[structured.NodeName] == nil {
|
|
model[structured.NodeName] = make(map[string]resourceModels)
|
|
}
|
|
resource := model[structured.NodeName][handle.DriverName]
|
|
for _, result := range structured.Results {
|
|
// Call AddAllocation for each known model. Each call itself needs to check for nil.
|
|
namedresourcesmodel.AddAllocation(&resource.namedresources, result.NamedResources)
|
|
}
|
|
}
|
|
}
|
|
|
|
return model, nil
|
|
}
|
|
|
|
func newClaimController(logger klog.Logger, class *resourcev1alpha2.ResourceClass, classParameters *resourcev1alpha2.ResourceClassParameters, claimParameters *resourcev1alpha2.ResourceClaimParameters) (*claimController, error) {
|
|
// Each node driver is separate from the others. Each driver may have
|
|
// multiple requests which need to be allocated together, so here
|
|
// we have to collect them per model.
|
|
type perDriverRequests struct {
|
|
parameters []runtime.RawExtension
|
|
requests []*resourcev1alpha2.NamedResourcesRequest
|
|
}
|
|
namedresourcesRequests := make(map[string]perDriverRequests)
|
|
for i, request := range claimParameters.DriverRequests {
|
|
driverName := request.DriverName
|
|
p := namedresourcesRequests[driverName]
|
|
for e, request := range request.Requests {
|
|
switch {
|
|
case request.ResourceRequestModel.NamedResources != nil:
|
|
p.parameters = append(p.parameters, request.VendorParameters)
|
|
p.requests = append(p.requests, request.ResourceRequestModel.NamedResources)
|
|
default:
|
|
return nil, fmt.Errorf("claim parameters %s: driverRequersts[%d].requests[%d]: no supported structured parameters found", klog.KObj(claimParameters), i, e)
|
|
}
|
|
}
|
|
if len(p.requests) > 0 {
|
|
namedresourcesRequests[driverName] = p
|
|
}
|
|
}
|
|
|
|
c := &claimController{
|
|
class: class,
|
|
classParameters: classParameters,
|
|
claimParameters: claimParameters,
|
|
namedresources: make(map[string]perDriverController, len(namedresourcesRequests)),
|
|
}
|
|
for driverName, perDriver := range namedresourcesRequests {
|
|
var filter *resourcev1alpha2.NamedResourcesFilter
|
|
if classParameters != nil {
|
|
for _, f := range classParameters.Filters {
|
|
if f.DriverName == driverName && f.ResourceFilterModel.NamedResources != nil {
|
|
filter = f.ResourceFilterModel.NamedResources
|
|
break
|
|
}
|
|
}
|
|
}
|
|
controller, err := namedresourcesmodel.NewClaimController(filter, perDriver.requests)
|
|
if err != nil {
|
|
return nil, fmt.Errorf("creating claim controller for named resources structured model: %w", err)
|
|
}
|
|
c.namedresources[driverName] = perDriverController{
|
|
parameters: perDriver.parameters,
|
|
controller: controller,
|
|
}
|
|
}
|
|
return c, nil
|
|
}
|
|
|
|
// claimController currently wraps exactly one structured parameter model.
|
|
|
|
type claimController struct {
|
|
class *resourcev1alpha2.ResourceClass
|
|
classParameters *resourcev1alpha2.ResourceClassParameters
|
|
claimParameters *resourcev1alpha2.ResourceClaimParameters
|
|
namedresources map[string]perDriverController
|
|
}
|
|
|
|
type perDriverController struct {
|
|
parameters []runtime.RawExtension
|
|
controller *namedresourcesmodel.Controller
|
|
}
|
|
|
|
func (c claimController) nodeIsSuitable(ctx context.Context, nodeName string, resources resources) (bool, error) {
|
|
nodeResources := resources[nodeName]
|
|
for driverName, perDriver := range c.namedresources {
|
|
okay, err := perDriver.controller.NodeIsSuitable(ctx, nodeResources[driverName].namedresources)
|
|
if err != nil {
|
|
// This is an error in the CEL expression which needs
|
|
// to be fixed. Better fail very visibly instead of
|
|
// ignoring the node.
|
|
return false, fmt.Errorf("checking node %q and resources of driver %q: %w", nodeName, driverName, err)
|
|
}
|
|
if !okay {
|
|
return false, nil
|
|
}
|
|
}
|
|
return true, nil
|
|
}
|
|
|
|
func (c claimController) allocate(ctx context.Context, nodeName string, resources resources) (string, *resourcev1alpha2.AllocationResult, error) {
|
|
allocation := &resourcev1alpha2.AllocationResult{
|
|
Shareable: c.claimParameters.Shareable,
|
|
AvailableOnNodes: &v1.NodeSelector{
|
|
NodeSelectorTerms: []v1.NodeSelectorTerm{
|
|
{
|
|
MatchExpressions: []v1.NodeSelectorRequirement{
|
|
{Key: "kubernetes.io/hostname", Operator: v1.NodeSelectorOpIn, Values: []string{nodeName}},
|
|
},
|
|
},
|
|
},
|
|
},
|
|
}
|
|
|
|
nodeResources := resources[nodeName]
|
|
for driverName, perDriver := range c.namedresources {
|
|
// Must return one entry for each request. The entry may be nil. This way,
|
|
// the result can be correlated with the per-request parameters.
|
|
results, err := perDriver.controller.Allocate(ctx, nodeResources[driverName].namedresources)
|
|
if err != nil {
|
|
return "", nil, fmt.Errorf("allocating via named resources structured model: %w", err)
|
|
}
|
|
handle := resourcev1alpha2.ResourceHandle{
|
|
DriverName: driverName,
|
|
StructuredData: &resourcev1alpha2.StructuredResourceHandle{
|
|
NodeName: nodeName,
|
|
},
|
|
}
|
|
for i, result := range results {
|
|
if result == nil {
|
|
continue
|
|
}
|
|
handle.StructuredData.Results = append(handle.StructuredData.Results,
|
|
resourcev1alpha2.DriverAllocationResult{
|
|
VendorRequestParameters: perDriver.parameters[i],
|
|
AllocationResultModel: resourcev1alpha2.AllocationResultModel{
|
|
NamedResources: result,
|
|
},
|
|
},
|
|
)
|
|
}
|
|
if c.classParameters != nil {
|
|
for _, p := range c.classParameters.VendorParameters {
|
|
if p.DriverName == driverName {
|
|
handle.StructuredData.VendorClassParameters = p.Parameters
|
|
break
|
|
}
|
|
}
|
|
}
|
|
for _, request := range c.claimParameters.DriverRequests {
|
|
if request.DriverName == driverName {
|
|
handle.StructuredData.VendorClaimParameters = request.VendorParameters
|
|
break
|
|
}
|
|
}
|
|
allocation.ResourceHandles = append(allocation.ResourceHandles, handle)
|
|
}
|
|
|
|
return c.class.DriverName, allocation, nil
|
|
}
|