make eviction message more clear
This commit is contained in:
@@ -388,7 +388,7 @@ func (m *managerImpl) synchronize(diskInfoProvider DiskInfoProvider, podFunc Act
|
|||||||
if !isHardEvictionThreshold(thresholdToReclaim) {
|
if !isHardEvictionThreshold(thresholdToReclaim) {
|
||||||
gracePeriodOverride = m.config.MaxPodGracePeriodSeconds
|
gracePeriodOverride = m.config.MaxPodGracePeriodSeconds
|
||||||
}
|
}
|
||||||
message, annotations := evictionMessage(resourceToReclaim, pod, statsFunc)
|
message, annotations := evictionMessage(resourceToReclaim, pod, statsFunc, thresholds, observations)
|
||||||
var condition *v1.PodCondition
|
var condition *v1.PodCondition
|
||||||
if utilfeature.DefaultFeatureGate.Enabled(features.PodDisruptionConditions) {
|
if utilfeature.DefaultFeatureGate.Enabled(features.PodDisruptionConditions) {
|
||||||
condition = &v1.PodCondition{
|
condition = &v1.PodCondition{
|
||||||
|
@@ -195,7 +195,7 @@ func TestMemoryPressure_VerifyPodStatus(t *testing.T) {
|
|||||||
wantPodStatus: v1.PodStatus{
|
wantPodStatus: v1.PodStatus{
|
||||||
Phase: v1.PodFailed,
|
Phase: v1.PodFailed,
|
||||||
Reason: "Evicted",
|
Reason: "Evicted",
|
||||||
Message: "The node was low on resource: memory. ",
|
Message: "The node was low on resource: memory. Threshold quantity: 2Gi, available: 1500Mi. ",
|
||||||
},
|
},
|
||||||
},
|
},
|
||||||
}
|
}
|
||||||
@@ -272,7 +272,7 @@ func TestMemoryPressure_VerifyPodStatus(t *testing.T) {
|
|||||||
Type: "DisruptionTarget",
|
Type: "DisruptionTarget",
|
||||||
Status: "True",
|
Status: "True",
|
||||||
Reason: "TerminationByKubelet",
|
Reason: "TerminationByKubelet",
|
||||||
Message: "The node was low on resource: memory. ",
|
Message: "The node was low on resource: memory. Threshold quantity: 2Gi, available: 1500Mi. ",
|
||||||
})
|
})
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -296,7 +296,7 @@ func TestDiskPressureNodeFs_VerifyPodStatus(t *testing.T) {
|
|||||||
wantPodStatus: v1.PodStatus{
|
wantPodStatus: v1.PodStatus{
|
||||||
Phase: v1.PodFailed,
|
Phase: v1.PodFailed,
|
||||||
Reason: "Evicted",
|
Reason: "Evicted",
|
||||||
Message: "The node was low on resource: ephemeral-storage. ",
|
Message: "The node was low on resource: ephemeral-storage. Threshold quantity: 2Gi, available: 1536Mi. ",
|
||||||
},
|
},
|
||||||
},
|
},
|
||||||
}
|
}
|
||||||
@@ -373,7 +373,7 @@ func TestDiskPressureNodeFs_VerifyPodStatus(t *testing.T) {
|
|||||||
Type: "DisruptionTarget",
|
Type: "DisruptionTarget",
|
||||||
Status: "True",
|
Status: "True",
|
||||||
Reason: "TerminationByKubelet",
|
Reason: "TerminationByKubelet",
|
||||||
Message: "The node was low on resource: ephemeral-storage. ",
|
Message: "The node was low on resource: ephemeral-storage. Threshold quantity: 2Gi, available: 1536Mi. ",
|
||||||
})
|
})
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@@ -43,7 +43,7 @@ const (
|
|||||||
// nodeConditionMessageFmt is the message for evictions due to resource pressure.
|
// nodeConditionMessageFmt is the message for evictions due to resource pressure.
|
||||||
nodeConditionMessageFmt = "The node had condition: %v. "
|
nodeConditionMessageFmt = "The node had condition: %v. "
|
||||||
// containerMessageFmt provides additional information for containers exceeding requests
|
// containerMessageFmt provides additional information for containers exceeding requests
|
||||||
containerMessageFmt = "Container %s was using %s, which exceeds its request of %s. "
|
containerMessageFmt = "Container %s was using %s, request is %s, has larger consumption of %v. "
|
||||||
// containerEphemeralStorageMessageFmt provides additional information for containers which have exceeded their ES limit
|
// containerEphemeralStorageMessageFmt provides additional information for containers which have exceeded their ES limit
|
||||||
containerEphemeralStorageMessageFmt = "Container %s exceeded its local ephemeral storage limit %q. "
|
containerEphemeralStorageMessageFmt = "Container %s exceeded its local ephemeral storage limit %q. "
|
||||||
// podEphemeralStorageMessageFmt provides additional information for pods which have exceeded their ES limit
|
// podEphemeralStorageMessageFmt provides additional information for pods which have exceeded their ES limit
|
||||||
@@ -60,6 +60,8 @@ const (
|
|||||||
OffendingContainersUsageKey = "offending_containers_usage"
|
OffendingContainersUsageKey = "offending_containers_usage"
|
||||||
// StarvedResourceKey is the key for the starved resource in eviction event annotations
|
// StarvedResourceKey is the key for the starved resource in eviction event annotations
|
||||||
StarvedResourceKey = "starved_resource"
|
StarvedResourceKey = "starved_resource"
|
||||||
|
// thresholdMetMessageFmt is the message for evictions due to resource pressure.
|
||||||
|
thresholdMetMessageFmt = "Threshold quantity: %v, available: %v. "
|
||||||
)
|
)
|
||||||
|
|
||||||
var (
|
var (
|
||||||
@@ -999,9 +1001,13 @@ func buildSignalToNodeReclaimFuncs(imageGC ImageGC, containerGC ContainerGC, wit
|
|||||||
}
|
}
|
||||||
|
|
||||||
// evictionMessage constructs a useful message about why an eviction occurred, and annotations to provide metadata about the eviction
|
// evictionMessage constructs a useful message about why an eviction occurred, and annotations to provide metadata about the eviction
|
||||||
func evictionMessage(resourceToReclaim v1.ResourceName, pod *v1.Pod, stats statsFunc) (message string, annotations map[string]string) {
|
func evictionMessage(resourceToReclaim v1.ResourceName, pod *v1.Pod, stats statsFunc, thresholds []evictionapi.Threshold, observations signalObservations) (message string, annotations map[string]string) {
|
||||||
annotations = make(map[string]string)
|
annotations = make(map[string]string)
|
||||||
message = fmt.Sprintf(nodeLowMessageFmt, resourceToReclaim)
|
message = fmt.Sprintf(nodeLowMessageFmt, resourceToReclaim)
|
||||||
|
quantity, available := getThresholdMetInfo(resourceToReclaim, thresholds, observations)
|
||||||
|
if quantity != nil && available != nil {
|
||||||
|
message += fmt.Sprintf(thresholdMetMessageFmt, quantity, available)
|
||||||
|
}
|
||||||
containers := []string{}
|
containers := []string{}
|
||||||
containerUsage := []string{}
|
containerUsage := []string{}
|
||||||
podStats, ok := stats(pod)
|
podStats, ok := stats(pod)
|
||||||
@@ -1024,7 +1030,7 @@ func evictionMessage(resourceToReclaim v1.ResourceName, pod *v1.Pod, stats stats
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
if usage != nil && usage.Cmp(requests) > 0 {
|
if usage != nil && usage.Cmp(requests) > 0 {
|
||||||
message += fmt.Sprintf(containerMessageFmt, container.Name, usage.String(), requests.String())
|
message += fmt.Sprintf(containerMessageFmt, container.Name, usage.String(), requests.String(), resourceToReclaim)
|
||||||
containers = append(containers, container.Name)
|
containers = append(containers, container.Name)
|
||||||
containerUsage = append(containerUsage, usage.String())
|
containerUsage = append(containerUsage, usage.String())
|
||||||
}
|
}
|
||||||
@@ -1036,3 +1042,18 @@ func evictionMessage(resourceToReclaim v1.ResourceName, pod *v1.Pod, stats stats
|
|||||||
annotations[StarvedResourceKey] = string(resourceToReclaim)
|
annotations[StarvedResourceKey] = string(resourceToReclaim)
|
||||||
return
|
return
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// getThresholdMetInfo get the threshold quantity and available for the resource resourceToReclaim
|
||||||
|
func getThresholdMetInfo(resourceToReclaim v1.ResourceName, thresholds []evictionapi.Threshold, observations signalObservations) (quantity *resource.Quantity, available *resource.Quantity) {
|
||||||
|
for i := range thresholds {
|
||||||
|
threshold := thresholds[i]
|
||||||
|
if signalToResource[threshold.Signal] == resourceToReclaim {
|
||||||
|
observed, found := observations[threshold.Signal]
|
||||||
|
if found {
|
||||||
|
quantity := evictionapi.GetThresholdQuantity(threshold.Value, observed.capacity)
|
||||||
|
return quantity, observed.available
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
return nil, nil
|
||||||
|
}
|
||||||
|
Reference in New Issue
Block a user