---
# HorizontalPodAutoscalerList holding a single HPA for the Deployment
# "isvc-raw-sklearn-batcher-1df94-predictor" in namespace kserve-ci-e2e-test.
# The content reads like a server-side dump (it carries managedFields, uid,
# resourceVersion and status) rather than a hand-written manifest.
apiVersion: autoscaling/v2
items:
  - apiVersion: autoscaling/v2
    kind: HorizontalPodAutoscaler
    metadata:
      annotations:
        # Annotation values must be strings, hence the quoted "true"/"32"/etc.
        internal.serving.kserve.io/batcher: "true"
        internal.serving.kserve.io/batcher-max-batchsize: "32"
        internal.serving.kserve.io/batcher-max-latency: "5000"
        internal.serving.kserve.io/storage-initializer-sourceuri: gs://kfserving-examples/models/sklearn/1.0/model
        prometheus.kserve.io/path: /metrics
        prometheus.kserve.io/port: "8080"
        service.beta.openshift.io/serving-cert-secret-name: isvc-raw-sklearn-batcher-1df94-predictor-serving-cert
        serving.kserve.io/deploymentMode: Standard
      creationTimestamp: "2026-04-22T17:41:28Z"
      labels:
        app: isvc.isvc-raw-sklearn-batcher-1df94-predictor
        component: predictor
        networking.kserve.io/visibility: exposed
        serving.kserve.io/inferenceservice: isvc-raw-sklearn-batcher-1df94
      # Field-ownership records: one entry per manager that wrote to this
      # object. Keys of the form f:<field> / k:{...} / "." are part of the
      # FieldsV1 encoding and must be kept verbatim.
      managedFields:
        # Entry written by the manager named "manager": metadata and spec.
        - apiVersion: autoscaling/v2
          fieldsType: FieldsV1
          fieldsV1:
            f:metadata:
              f:annotations:
                .: {}
                f:internal.serving.kserve.io/batcher: {}
                f:internal.serving.kserve.io/batcher-max-batchsize: {}
                f:internal.serving.kserve.io/batcher-max-latency: {}
                f:internal.serving.kserve.io/storage-initializer-sourceuri: {}
                f:prometheus.kserve.io/path: {}
                f:prometheus.kserve.io/port: {}
                f:service.beta.openshift.io/serving-cert-secret-name: {}
                f:serving.kserve.io/deploymentMode: {}
              f:labels:
                .: {}
                f:app: {}
                f:component: {}
                f:networking.kserve.io/visibility: {}
                f:serving.kserve.io/inferenceservice: {}
              f:ownerReferences:
                .: {}
                k:{"uid":"871dda5c-e02e-4773-8dc4-13e8375a0138"}: {}
            f:spec:
              f:behavior:
                .: {}
                f:scaleDown:
                  .: {}
                  f:policies: {}
                  f:selectPolicy: {}
                f:scaleUp:
                  .: {}
                  f:policies: {}
                  f:selectPolicy: {}
                  f:stabilizationWindowSeconds: {}
              f:maxReplicas: {}
              f:metrics: {}
              f:minReplicas: {}
              f:scaleTargetRef:
                f:apiVersion: {}
                f:kind: {}
                f:name: {}
          manager: manager
          operation: Update
          time: "2026-04-22T17:41:28Z"
        # Entry written by kube-controller-manager via the status subresource.
        - apiVersion: autoscaling/v2
          fieldsType: FieldsV1
          fieldsV1:
            f:status:
              f:conditions:
                .: {}
                k:{"type":"AbleToScale"}:
                  .: {}
                  f:lastTransitionTime: {}
                  f:message: {}
                  f:reason: {}
                  f:status: {}
                  f:type: {}
                k:{"type":"ScalingActive"}:
                  .: {}
                  f:lastTransitionTime: {}
                  f:message: {}
                  f:reason: {}
                  f:status: {}
                  f:type: {}
                k:{"type":"ScalingLimited"}:
                  .: {}
                  f:lastTransitionTime: {}
                  f:message: {}
                  f:reason: {}
                  f:status: {}
                  f:type: {}
              f:currentMetrics: {}
              f:currentReplicas: {}
              f:desiredReplicas: {}
          manager: kube-controller-manager
          operation: Update
          subresource: status
          time: "2026-04-22T19:04:19Z"
      name: isvc-raw-sklearn-batcher-1df94-predictor
      namespace: kserve-ci-e2e-test
      # Owned and controlled by the InferenceService of the same base name.
      ownerReferences:
        - apiVersion: serving.kserve.io/v1beta1
          blockOwnerDeletion: true
          controller: true
          kind: InferenceService
          name: isvc-raw-sklearn-batcher-1df94
          uid: 871dda5c-e02e-4773-8dc4-13e8375a0138
      resourceVersion: "47562"
      uid: 40d005f7-b142-4b8c-ae80-ab8d5484474b
    spec:
      behavior:
        scaleDown:
          policies:
            - periodSeconds: 15
              type: Percent
              value: 100
          selectPolicy: Max
        scaleUp:
          policies:
            - periodSeconds: 15
              type: Pods
              value: 4
            - periodSeconds: 15
              type: Percent
              value: 100
          selectPolicy: Max
          stabilizationWindowSeconds: 0
      # NOTE(review): maxReplicas == minReplicas == 1, so the replica count is
      # pinned at 1 regardless of the CPU metric below - confirm this is the
      # intended configuration for this service.
      maxReplicas: 1
      metrics:
        - resource:
            name: cpu
            target:
              averageUtilization: 80
              type: Utilization
          type: Resource
      minReplicas: 1
      scaleTargetRef:
        apiVersion: apps/v1
        kind: Deployment
        name: isvc-raw-sklearn-batcher-1df94-predictor
    status:
      conditions:
        # Condition "status" values are the strings "True"/"False", not YAML
        # booleans; keep them quoted.
        - lastTransitionTime: "2026-04-22T17:41:43Z"
          message: recommended size matches current size
          reason: ReadyForNewScale
          status: "True"
          type: AbleToScale
        - lastTransitionTime: "2026-04-22T17:43:59Z"
          # Folded scalar: resolves to the same single-line message string.
          message: >-
            the HPA was able to successfully calculate a replica count from
            cpu resource utilization (percentage of request)
          reason: ValidMetricFound
          status: "True"
          type: ScalingActive
        - lastTransitionTime: "2026-04-22T17:43:59Z"
          message: the desired count is within the acceptable range
          reason: DesiredWithinRange
          status: "False"
          type: ScalingLimited
      currentMetrics:
        - resource:
            current:
              averageUtilization: 12
              averageValue: 19m
            name: cpu
          type: Resource
      currentReplicas: 1
      desiredReplicas: 1
kind: HorizontalPodAutoscalerList
metadata:
  resourceVersion: "47868"