Log failed state updates correctly
Signed-off-by: Arjun Naik <arjun@arjunnaik.in>
This commit is contained in:
parent
0183d5548e
commit
bd09b0b719
|
|
@ -367,7 +367,9 @@ func (feeder *clusterStateFeeder) LoadPods() {
|
|||
}
|
||||
feeder.clusterState.AddOrUpdatePod(pod.ID, pod.PodLabels, pod.Phase)
|
||||
for _, container := range pod.Containers {
|
||||
feeder.clusterState.AddOrUpdateContainer(container.ID, container.Request)
|
||||
if err = feeder.clusterState.AddOrUpdateContainer(container.ID, container.Request); err != nil {
|
||||
klog.Warningf("Failed to add container %+v. Reason: %+v", container.ID, err)
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
|
@ -383,6 +385,10 @@ func (feeder *clusterStateFeeder) LoadRealTimeMetrics() {
|
|||
for _, containerMetrics := range containersMetrics {
|
||||
for _, sample := range newContainerUsageSamplesWithKey(containerMetrics) {
|
||||
if err := feeder.clusterState.AddSample(sample); err != nil {
|
||||
// Not all pod states are tracked in memory saver mode
|
||||
if _, isKeyError := err.(model.KeyError); isKeyError && feeder.memorySaveMode {
|
||||
continue
|
||||
}
|
||||
klog.Warningf("Error adding metric sample for container %v: %v", sample.Container, err)
|
||||
droppedSampleCount++
|
||||
} else {
|
||||
|
|
@ -396,7 +402,9 @@ Loop:
|
|||
select {
|
||||
case oomInfo := <-feeder.oomChan:
|
||||
klog.V(3).Infof("OOM detected %+v", oomInfo)
|
||||
feeder.clusterState.RecordOOM(oomInfo.ContainerID, oomInfo.Timestamp, oomInfo.Memory)
|
||||
if err = feeder.clusterState.RecordOOM(oomInfo.ContainerID, oomInfo.Timestamp, oomInfo.Memory); err != nil {
|
||||
klog.Warningf("Failed to record OOM %+v. Reason: %+v", oomInfo, err)
|
||||
}
|
||||
default:
|
||||
break Loop
|
||||
}
|
||||
|
|
|
|||
|
|
@ -155,7 +155,9 @@ func getCappedRecommendation(vpaID model.VpaID, resources logic.RecommendedPodRe
|
|||
func (r *recommender) MaintainCheckpoints(ctx context.Context, minCheckpointsPerRun int) {
|
||||
now := time.Now()
|
||||
if r.useCheckpoints {
|
||||
r.checkpointWriter.StoreCheckpoints(ctx, now, minCheckpointsPerRun)
|
||||
if err := r.checkpointWriter.StoreCheckpoints(ctx, now, minCheckpointsPerRun); err != nil {
|
||||
klog.Warningf("Failed to store checkpoints. Reason: %+v", err)
|
||||
}
|
||||
if time.Now().Sub(r.lastCheckpointGC) > r.checkpointsGCInterval {
|
||||
r.lastCheckpointGC = now
|
||||
r.clusterStateFeeder.GarbageCollectCheckpoints()
|
||||
|
|
|
|||
Loading…
Reference in New Issue