---
# HorizontalPodAutoscalerList holding a single HPA from namespace
# kserve-ci-e2e-test. The HPA targets the Deployment
# success-200-isvc-a9320-predictor and is owned by the InferenceService
# success-200-isvc-a9320 (see ownerReferences).
apiVersion: autoscaling/v2
items:
- apiVersion: autoscaling/v2
  kind: HorizontalPodAutoscaler
  metadata:
    annotations:
      service.beta.openshift.io/serving-cert-secret-name: success-200-isvc-a9320-predictor-serving-cert
      serving.kserve.io/deploymentMode: Standard
    creationTimestamp: "2026-04-22T18:04:13Z"
    labels:
      app: isvc.success-200-isvc-a9320-predictor
      component: predictor
      serving.kserve.io/inferenceservice: success-200-isvc-a9320
    # Field-ownership records, one entry per manager: "manager" wrote
    # metadata and spec; "kube-controller-manager" wrote the status
    # subresource.
    managedFields:
    - apiVersion: autoscaling/v2
      fieldsType: FieldsV1
      fieldsV1:
        f:metadata:
          f:annotations:
            .: {}
            f:service.beta.openshift.io/serving-cert-secret-name: {}
            f:serving.kserve.io/deploymentMode: {}
          f:labels:
            .: {}
            f:app: {}
            f:component: {}
            f:serving.kserve.io/inferenceservice: {}
          f:ownerReferences:
            .: {}
            k:{"uid":"7f67703e-a470-4118-ad4e-50cb2096a222"}: {}
        f:spec:
          f:behavior:
            .: {}
            f:scaleDown:
              .: {}
              f:policies: {}
              f:selectPolicy: {}
            f:scaleUp:
              .: {}
              f:policies: {}
              f:selectPolicy: {}
              f:stabilizationWindowSeconds: {}
          f:maxReplicas: {}
          f:metrics: {}
          f:minReplicas: {}
          f:scaleTargetRef:
            f:apiVersion: {}
            f:kind: {}
            f:name: {}
      manager: manager
      operation: Update
      time: "2026-04-22T18:04:13Z"
    - apiVersion: autoscaling/v2
      fieldsType: FieldsV1
      fieldsV1:
        f:status:
          f:conditions:
            .: {}
            k:{"type":"AbleToScale"}:
              .: {}
              f:lastTransitionTime: {}
              f:message: {}
              f:reason: {}
              f:status: {}
              f:type: {}
            k:{"type":"ScalingActive"}:
              .: {}
              f:lastTransitionTime: {}
              f:message: {}
              f:reason: {}
              f:status: {}
              f:type: {}
            k:{"type":"ScalingLimited"}:
              .: {}
              f:lastTransitionTime: {}
              f:message: {}
              f:reason: {}
              f:status: {}
              f:type: {}
          f:currentMetrics: {}
          f:currentReplicas: {}
          f:desiredReplicas: {}
      manager: kube-controller-manager
      operation: Update
      subresource: status
      time: "2026-04-22T18:05:43Z"
    name: success-200-isvc-a9320-predictor
    namespace: kserve-ci-e2e-test
    ownerReferences:
    - apiVersion: serving.kserve.io/v1beta1
      blockOwnerDeletion: true
      controller: true
      kind: InferenceService
      name: success-200-isvc-a9320
      uid: 7f67703e-a470-4118-ad4e-50cb2096a222
    resourceVersion: "14561"
    uid: 9e8eb40a-c67b-4365-aa28-64bfdc2a1ecd
  spec:
    behavior:
      scaleDown:
        policies:
        - periodSeconds: 15
          type: Percent
          value: 100
        selectPolicy: Max
      scaleUp:
        policies:
        - periodSeconds: 15
          type: Pods
          value: 4
        - periodSeconds: 15
          type: Percent
          value: 100
        selectPolicy: Max
        stabilizationWindowSeconds: 0
    # minReplicas and maxReplicas are both 1, so the allowed replica range
    # is a single value regardless of the CPU metric below.
    maxReplicas: 1
    metrics:
    - resource:
        name: cpu
        target:
          averageUtilization: 80
          type: Utilization
      type: Resource
    minReplicas: 1
    scaleTargetRef:
      apiVersion: apps/v1
      kind: Deployment
      name: success-200-isvc-a9320-predictor
  # Reported state: 4% average CPU utilization against the 80% target,
  # with current and desired replicas both at 1.
  status:
    conditions:
    - lastTransitionTime: "2026-04-22T18:04:28Z"
      message: recommended size matches current size
      reason: ReadyForNewScale
      status: "True"
      type: AbleToScale
    - lastTransitionTime: "2026-04-22T18:05:43Z"
      message: the HPA was able to successfully calculate a replica count from
        cpu resource utilization (percentage of request)
      reason: ValidMetricFound
      status: "True"
      type: ScalingActive
    - lastTransitionTime: "2026-04-22T18:05:43Z"
      message: the desired count is within the acceptable range
      reason: DesiredWithinRange
      status: "False"
      type: ScalingLimited
    currentMetrics:
    - resource:
        current:
          averageUtilization: 4
          averageValue: 2m
        name: cpu
      type: Resource
    currentReplicas: 1
    desiredReplicas: 1
kind: HorizontalPodAutoscalerList
metadata:
  resourceVersion: "39216"