mercari · randytqwjp · Dec 20, 2024 · Dec 20, 2024 · Dec 23, 2024 · Dec 25, 2024
@@ -70,15 +70,15 @@ status:
       type: ScaledUpBasedOnPreferredMaxReplicas
     - lastTransitionTime: "2023-01-01T00:00:00Z"
       lastUpdateTime: "2023-01-01T00:00:00Z"
-      message: HPA target utilization is updated
-      reason: HPATargetUtilizationUpdated
+      message: The recommendation is provided
       status: "True"
-      type: HPATargetUtilizationUpdated
+      type: VerticalRecommendationUpdated
     - lastTransitionTime: "2023-01-01T00:00:00Z"
       lastUpdateTime: "2023-01-01T00:00:00Z"
-      message: The recommendation is provided
+      message: HPA target utilization is updated
+      reason: HPATargetUtilizationUpdated
       status: "True"
-      type: VerticalRecommendationUpdated
+      type: HPATargetUtilizationUpdated
     - lastTransitionTime: "2023-01-01T00:00:00Z"
       lastUpdateTime: "2023-01-01T00:00:00Z"
       status: "False"

@@ -70,15 +70,15 @@ status:
       type: ScaledUpBasedOnPreferredMaxReplicas
     - lastTransitionTime: "2023-01-01T00:00:00Z"
       lastUpdateTime: "2023-01-01T00:00:00Z"
-      message: HPA target utilization is updated
-      reason: HPATargetUtilizationUpdated
+      message: The recommendation is provided
       status: "True"
-      type: HPATargetUtilizationUpdated
+      type: VerticalRecommendationUpdated
     - lastTransitionTime: "2023-01-01T00:00:00Z"
       lastUpdateTime: "2023-01-01T00:00:00Z"
-      message: The recommendation is provided
+      message: HPA target utilization is updated
+      reason: HPATargetUtilizationUpdated
       status: "True"
-      type: VerticalRecommendationUpdated
+      type: HPATargetUtilizationUpdated
     - lastTransitionTime: "2023-01-01T00:00:00Z"
       lastUpdateTime: "2023-01-01T00:00:00Z"
       status: "False"

@@ -70,15 +70,15 @@ status:
       type: ScaledUpBasedOnPreferredMaxReplicas
     - lastTransitionTime: "2023-01-01T00:00:00Z"
       lastUpdateTime: "2023-01-01T00:00:00Z"
-      message: HPA target utilization is updated
-      reason: HPATargetUtilizationUpdated
+      message: The recommendation is provided
       status: "True"
-      type: HPATargetUtilizationUpdated
+      type: VerticalRecommendationUpdated
     - lastTransitionTime: "2023-01-01T00:00:00Z"
       lastUpdateTime: "2023-01-01T00:00:00Z"
-      message: The recommendation is provided
+      message: HPA target utilization is updated
+      reason: HPATargetUtilizationUpdated
       status: "True"
-      type: VerticalRecommendationUpdated
+      type: HPATargetUtilizationUpdated
     - lastTransitionTime: "2023-01-01T00:00:00Z"
       lastUpdateTime: "2023-01-01T00:00:00Z"
       status: "False"

@@ -70,15 +70,15 @@ status:
       type: ScaledUpBasedOnPreferredMaxReplicas
     - lastTransitionTime: "2023-01-01T00:00:00Z"
       lastUpdateTime: "2023-01-01T00:00:00Z"
-      message: HPA target utilization is updated
-      reason: HPATargetUtilizationUpdated
+      message: The recommendation is provided
       status: "True"
-      type: HPATargetUtilizationUpdated
+      type: VerticalRecommendationUpdated
     - lastTransitionTime: "2023-01-01T00:00:00Z"
       lastUpdateTime: "2023-01-01T00:00:00Z"
-      message: The recommendation is provided
+      message: HPA target utilization is updated
+      reason: HPATargetUtilizationUpdated
       status: "True"
-      type: VerticalRecommendationUpdated
+      type: HPATargetUtilizationUpdated
     - lastTransitionTime: "2023-01-01T00:00:00Z"
       lastUpdateTime: "2023-01-01T00:00:00Z"
       status: "False"

@@ -70,15 +70,15 @@ status:
       type: ScaledUpBasedOnPreferredMaxReplicas
     - lastTransitionTime: "2023-01-01T00:00:00Z"
       lastUpdateTime: "2023-01-01T00:00:00Z"
-      message: HPA target utilization is updated
-      reason: HPATargetUtilizationUpdated
+      message: The recommendation is provided
       status: "True"
-      type: HPATargetUtilizationUpdated
+      type: VerticalRecommendationUpdated
     - lastTransitionTime: "2023-01-01T00:00:00Z"
       lastUpdateTime: "2023-01-01T00:00:00Z"
-      message: The recommendation is provided
+      message: HPA target utilization is updated
+      reason: HPATargetUtilizationUpdated
       status: "True"
-      type: VerticalRecommendationUpdated
+      type: HPATargetUtilizationUpdated
     - lastTransitionTime: "2023-01-01T00:00:00Z"
       lastUpdateTime: "2023-01-01T00:00:00Z"
       status: "False"

@@ -47,15 +47,15 @@ status:
       type: ScaledUpBasedOnPreferredMaxReplicas
     - lastTransitionTime: "2023-01-01T00:00:00Z"
       lastUpdateTime: "2023-01-01T00:00:00Z"
-      message: HPA target utilization is updated
-      reason: HPATargetUtilizationUpdated
+      message: The recommendation is provided
       status: "True"
-      type: HPATargetUtilizationUpdated
+      type: VerticalRecommendationUpdated
     - lastTransitionTime: "2023-01-01T00:00:00Z"
       lastUpdateTime: "2023-01-01T00:00:00Z"
-      message: The recommendation is provided
+      message: HPA target utilization is updated
+      reason: HPATargetUtilizationUpdated
       status: "True"
-      type: VerticalRecommendationUpdated
+      type: HPATargetUtilizationUpdated
     - lastTransitionTime: "2023-01-01T00:00:00Z"
       lastUpdateTime: "2023-01-01T00:00:00Z"
       status: "False"

@@ -53,15 +53,15 @@ status:
       type: ScaledUpBasedOnPreferredMaxReplicas
     - lastTransitionTime: "2023-01-01T00:00:00Z"
       lastUpdateTime: "2023-01-01T00:00:00Z"
-      message: HPA target utilization is updated
-      reason: HPATargetUtilizationUpdated
+      message: The recommendation is provided
       status: "True"
-      type: HPATargetUtilizationUpdated
+      type: VerticalRecommendationUpdated
     - lastTransitionTime: "2023-01-01T00:00:00Z"
       lastUpdateTime: "2023-01-01T00:00:00Z"
-      message: The recommendation is provided
+      message: HPA target utilization is updated
+      reason: HPATargetUtilizationUpdated
       status: "True"
-      type: VerticalRecommendationUpdated
+      type: HPATargetUtilizationUpdated
     - lastTransitionTime: "2023-01-01T00:00:00Z"
       lastUpdateTime: "2023-01-01T00:00:00Z"
       status: "False"

@@ -47,15 +47,15 @@ status:
       type: ScaledUpBasedOnPreferredMaxReplicas
     - lastTransitionTime: "2023-01-01T00:00:00Z"
       lastUpdateTime: "2023-01-01T00:00:00Z"
-      message: HPA target utilization is updated
-      reason: HPATargetUtilizationUpdated
+      message: The recommendation is provided
       status: "True"
-      type: HPATargetUtilizationUpdated
+      type: VerticalRecommendationUpdated
     - lastTransitionTime: "2023-01-01T00:00:00Z"
       lastUpdateTime: "2023-01-01T00:00:00Z"
-      message: The recommendation is provided
+      message: HPA target utilization is updated
+      reason: HPATargetUtilizationUpdated
       status: "True"
-      type: VerticalRecommendationUpdated
+      type: HPATargetUtilizationUpdated
     - lastTransitionTime: "2023-01-01T00:00:00Z"
       lastUpdateTime: "2023-01-01T00:00:00Z"
       status: "False"

@@ -258,15 +258,15 @@ func (r *TortoiseReconciler) Reconcile(ctx context.Context, req ctrl.Request) (_
 		return ctrl.Result{RequeueAfter: r.Interval}, nil
 	}
 
-	_, tortoise, err = r.HpaService.UpdateHPAFromTortoiseRecommendation(ctx, tortoise, now)
+	tortoise, err = r.TortoiseService.UpdateResourceRequest(ctx, tortoise, currentDesiredReplicaNum, now)
 	if err != nil {
-		logger.Error(err, "update HPA based on the recommendation in tortoise", "tortoise", req.NamespacedName)
+		logger.Error(err, "update VPA based on the recommendation in tortoise", "tortoise", req.NamespacedName)
 		return ctrl.Result{}, err
 	}
 
-	tortoise, err = r.TortoiseService.UpdateResourceRequest(ctx, tortoise, currentDesiredReplicaNum, now)
+	_, tortoise, err = r.HpaService.UpdateHPAFromTortoiseRecommendation(ctx, tortoise, now)
 	if err != nil {
-		logger.Error(err, "update VPA based on the recommendation in tortoise", "tortoise", req.NamespacedName)
+		logger.Error(err, "update HPA based on the recommendation in tortoise", "tortoise", req.NamespacedName)
 		return ctrl.Result{}, err
 	}
 

@@ -405,6 +405,7 @@ func (c *Service) ChangeHPAFromTortoiseRecommendation(tortoise *autoscalingv1bet
 		recommendMax = c.maximumMaxReplica
 	}
 
+	oldMax := hpa.Spec.MaxReplicas
 	hpa.Spec.MaxReplicas = recommendMax
 
 	recommendMin, err := GetReplicasRecommendation(tortoise.Status.Recommendations.Horizontal.MinReplicas, now)
@@ -443,19 +444,33 @@ func (c *Service) ChangeHPAFromTortoiseRecommendation(tortoise *autoscalingv1bet
 		minToActuallyApply = recommendMin
 	}
 
+	oldMin := *hpa.Spec.MinReplicas
 	hpa.Spec.MinReplicas = &minToActuallyApply
 	if tortoise.Spec.UpdateMode != autoscalingv1beta3.UpdateModeOff && recordMetrics {
 		// We don't want to record applied* metric when UpdateMode is Off.
-		netChangeMaxReplicas := float64(hpa.Spec.MaxReplicas - recommendMax)
-		netChangeMinReplicas := float64(*hpa.Spec.MinReplicas) - float64(recommendMin)
-		if netChangeMaxReplicas > 0 || netChangeMinReplicas < 0 {
-			metrics.IncreaseApplyCounter.WithLabelValues(tortoise.Name, tortoise.Namespace).Add(1)
-		}
-		if netChangeMaxReplicas < 0 || netChangeMinReplicas > 0 {
-			metrics.DecreaseApplyCounter.WithLabelValues(tortoise.Name, tortoise.Namespace).Add(1)
+		netChangeMaxReplicas := float64(recommendMax - oldMax)
+		netChangeMinReplicas := float64(recommendMin - oldMin)
+		cpu := float64(0)
+		mem := float64(0)
+		for _, r := range tortoise.Status.Conditions.ContainerResourceRequests {
+			for resourcename, value := range r.Resource {
+				if resourcename == corev1.ResourceCPU {
+					cpu += value.AsApproximateFloat64()
+				}
+				if resourcename == corev1.ResourceMemory {
+					mem += value.AsApproximateFloat64()
+				}
+			}
 		}
-		metrics.NetHPAMinReplicas.WithLabelValues(tortoise.Name, tortoise.Namespace, hpa.Name, tortoise.Spec.TargetRefs.ScaleTargetRef.Name).Set(netChangeMinReplicas)
-		metrics.NetHPAMaxReplicas.WithLabelValues(tortoise.Name, tortoise.Namespace, hpa.Name, tortoise.Spec.TargetRefs.ScaleTargetRef.Name).Set(netChangeMaxReplicas)
+		netChangeMaxReplicasCpu := netChangeMaxReplicas * cpu
+		netChangeMinReplicasCpu := netChangeMinReplicas * cpu
+		netChangeMinReplicasMem := netChangeMinReplicas * mem
+		netChangeMaxReplicasMem := netChangeMaxReplicas * mem
+
+		metrics.NetHPAMinReplicasCPUCores.WithLabelValues(tortoise.Name, tortoise.Namespace, hpa.Name).Set(netChangeMinReplicasCpu)
+		metrics.NetHPAMaxReplicasCPUCores.WithLabelValues(tortoise.Name, tortoise.Namespace, hpa.Name).Set(netChangeMaxReplicasCpu)
+		metrics.NetHPAMinReplicasMemory.WithLabelValues(tortoise.Name, tortoise.Namespace, hpa.Name).Set(netChangeMinReplicasMem)
+		metrics.NetHPAMaxReplicasMemory.WithLabelValues(tortoise.Name, tortoise.Namespace, hpa.Name).Set(netChangeMaxReplicasMem)
 		metrics.AppliedHPAMinReplicas.WithLabelValues(tortoise.Name, tortoise.Namespace, hpa.Name).Set(float64(*hpa.Spec.MinReplicas))
 		metrics.AppliedHPAMaxReplicas.WithLabelValues(tortoise.Name, tortoise.Namespace, hpa.Name).Set(float64(hpa.Spec.MaxReplicas))
 	}

@@ -46,25 +46,25 @@ var (
 		Help: "memory request (byte) that tortoises actually applys",
 	}, []string{"tortoise_name", "namespace", "container_name", "controller_name", "controller_kind"})
 
-	DecreaseApplyCounter = prometheus.NewCounterVec(prometheus.CounterOpts{
-		Name: "decrease_apply_counter",
-		Help: "counter for number of resource decreases applied by tortoise",
-	}, []string{"tortoise_name", "namespace"})
-
-	IncreaseApplyCounter = prometheus.NewCounterVec(prometheus.CounterOpts{
-		Name: "increase_apply_counter",
-		Help: "counter for number of resource increases applied by tortoise",
-	}, []string{"tortoise_name", "namespace"})
-
-	NetHPAMinReplicas = prometheus.NewGaugeVec(prometheus.GaugeOpts{
-		Name: "net_hpa_minreplicas",
-		Help: "net hpa minReplicas that tortoises actually applys to hpa",
-	}, []string{"tortoise_name", "namespace", "hpa_name", "kube_deployment"})
-
-	NetHPAMaxReplicas = prometheus.NewGaugeVec(prometheus.GaugeOpts{
-		Name: "net_hpa_maxreplicas",
-		Help: "net hpa maxReplicas that tortoises actually applys to hpa",
-	}, []string{"tortoise_name", "namespace", "hpa_name", "kube_deployment"})
+	NetHPAMinReplicasCPUCores = prometheus.NewGaugeVec(prometheus.GaugeOpts{
+		Name: "net_hpa_minreplicas_cpu_cores",
+		Help: "net cpu cores changed by minReplicas that tortoises actually applys to hpa",
+	}, []string{"tortoise_name", "namespace", "hpa_name"})
+
+	NetHPAMinReplicasMemory = prometheus.NewGaugeVec(prometheus.GaugeOpts{
+		Name: "net_hpa_minreplicas_memory",
+		Help: "net memory changed by minReplicas that tortoises actually applys to hpa",
+	}, []string{"tortoise_name", "namespace", "hpa_name"})
+
+	NetHPAMaxReplicasCPUCores = prometheus.NewGaugeVec(prometheus.GaugeOpts{
+		Name: "net_hpa_maxreplicas_cpu_cores",
+		Help: "net cpu cores changed by maxReplicas that tortoises actually applys to hpa",
+	}, []string{"tortoise_name", "namespace", "hpa_name"})
+
+	NetHPAMaxReplicasMemory = prometheus.NewGaugeVec(prometheus.GaugeOpts{
+		Name: "net_hpa_maxreplicas_memory",
+		Help: "net memory changed by maxReplicas that tortoises actually applys to hpa",
+	}, []string{"tortoise_name", "namespace", "hpa_name"})
 
 	NetCPURequest = prometheus.NewGaugeVec(prometheus.GaugeOpts{
 		Name: "net_cpu_request",
@@ -117,10 +117,10 @@ func init() {
 		AppliedHPAMinReplicas,
 		AppliedCPURequest,
 		AppliedMemoryRequest,
-		IncreaseApplyCounter,
-		DecreaseApplyCounter,
-		NetHPAMaxReplicas,
-		NetHPAMinReplicas,
+		NetHPAMinReplicasCPUCores,
+		NetHPAMinReplicasMemory,
+		NetHPAMaxReplicasCPUCores,
+		NetHPAMaxReplicasMemory,
 		NetCPURequest,
 		NetMemoryRequest,
 		ProposedHPATargetUtilization,

@@ -768,21 +768,15 @@ func (c *Service) UpdateResourceRequest(ctx context.Context, tortoise *v1beta3.T
 		// only record metrics once in every reconcile loop.
 		for resourcename, value := range r.Resource {
 			oldRequest := oldRequestMap[r.ContainerName][resourcename]
-			netChange := float64(oldRequest.MilliValue() - value.MilliValue())
+			netChange := float64(oldRequest.MilliValue()-value.MilliValue()) * float64(replica)
 			if resourcename == corev1.ResourceCPU {
 				// We don't want to record applied* metric when UpdateMode is Off.
 				metrics.AppliedCPURequest.WithLabelValues(tortoise.Name, tortoise.Namespace, r.ContainerName, tortoise.Spec.TargetRefs.ScaleTargetRef.Name, tortoise.Spec.TargetRefs.ScaleTargetRef.Kind).Set(float64(value.MilliValue()))
 				metrics.NetCPURequest.WithLabelValues(tortoise.Name, tortoise.Namespace, r.ContainerName, tortoise.Spec.TargetRefs.ScaleTargetRef.Name, tortoise.Spec.TargetRefs.ScaleTargetRef.Kind).Set(netChange)
 			}
 			if resourcename == corev1.ResourceMemory {
 				metrics.AppliedMemoryRequest.WithLabelValues(tortoise.Name, tortoise.Namespace, r.ContainerName, tortoise.Spec.TargetRefs.ScaleTargetRef.Name, tortoise.Spec.TargetRefs.ScaleTargetRef.Kind).Set(float64(value.Value()))
-				metrics.NetMemoryRequest.WithLabelValues(tortoise.Name, tortoise.Namespace, r.ContainerName, tortoise.Spec.TargetRefs.ScaleTargetRef.Name, tortoise.Spec.TargetRefs.ScaleTargetRef.Kind).Set(float64(netChange))
-			}
-			if netChange > 0 {
-				metrics.IncreaseApplyCounter.WithLabelValues(tortoise.Name, tortoise.Namespace).Add(1)
-			}
-			if netChange < 0 {
-				metrics.DecreaseApplyCounter.WithLabelValues(tortoise.Name, tortoise.Namespace).Add(1)
+				metrics.NetMemoryRequest.WithLabelValues(tortoise.Name, tortoise.Namespace, r.ContainerName, tortoise.Spec.TargetRefs.ScaleTargetRef.Name, tortoise.Spec.TargetRefs.ScaleTargetRef.Kind).Set(netChange / float64(1000))
 			}
 		}
 	}