---
# HorizontalPodAutoscalerList (autoscaling/v2) captured from namespace
# kserve-ci-e2e-test. The visible portion holds a single HPA, owned by the
# InferenceService "isvc-raw-sklearn-batcher-ccfea", that targets the
# Deployment "isvc-raw-sklearn-batcher-ccfea-predictor".
apiVersion: autoscaling/v2
items:
  - apiVersion: autoscaling/v2
    kind: HorizontalPodAutoscaler
    metadata:
      # Annotation values are strings, so numeric/boolean-looking values
      # ("true", "32", "5000", "8080") must stay quoted.
      annotations:
        internal.serving.kserve.io/batcher: "true"
        internal.serving.kserve.io/batcher-max-batchsize: "32"
        internal.serving.kserve.io/batcher-max-latency: "5000"
        internal.serving.kserve.io/storage-initializer-sourceuri: gs://kfserving-examples/models/sklearn/1.0/model
        prometheus.kserve.io/path: /metrics
        prometheus.kserve.io/port: "8080"
        service.beta.openshift.io/serving-cert-secret-name: isvc-raw-sklearn-batcher-ccfea-predictor-serving-cert
        serving.kserve.io/deploymentMode: Standard
      creationTimestamp: "2026-04-22T18:44:39Z"
      labels:
        app: isvc.isvc-raw-sklearn-batcher-ccfea-predictor
        component: predictor
        networking.kserve.io/visibility: exposed
        serving.kserve.io/inferenceservice: isvc-raw-sklearn-batcher-ccfea
      # Field-ownership records: the first entry (manager "manager") covers
      # metadata and spec; the second (kube-controller-manager, status
      # subresource) covers status.
      managedFields:
        - apiVersion: autoscaling/v2
          fieldsType: FieldsV1
          fieldsV1:
            f:metadata:
              f:annotations:
                .: {}
                f:internal.serving.kserve.io/batcher: {}
                f:internal.serving.kserve.io/batcher-max-batchsize: {}
                f:internal.serving.kserve.io/batcher-max-latency: {}
                f:internal.serving.kserve.io/storage-initializer-sourceuri: {}
                f:prometheus.kserve.io/path: {}
                f:prometheus.kserve.io/port: {}
                f:service.beta.openshift.io/serving-cert-secret-name: {}
                f:serving.kserve.io/deploymentMode: {}
              f:labels:
                .: {}
                f:app: {}
                f:component: {}
                f:networking.kserve.io/visibility: {}
                f:serving.kserve.io/inferenceservice: {}
              f:ownerReferences:
                .: {}
                k:{"uid":"625f01ea-5558-4b8b-ad2b-9a2fb95a8d7f"}: {}
            f:spec:
              f:behavior:
                .: {}
                f:scaleDown:
                  .: {}
                  f:policies: {}
                  f:selectPolicy: {}
                f:scaleUp:
                  .: {}
                  f:policies: {}
                  f:selectPolicy: {}
                  f:stabilizationWindowSeconds: {}
              f:maxReplicas: {}
              f:metrics: {}
              f:minReplicas: {}
              f:scaleTargetRef:
                f:apiVersion: {}
                f:kind: {}
                f:name: {}
          manager: manager
          operation: Update
          time: "2026-04-22T18:44:39Z"
        - apiVersion: autoscaling/v2
          fieldsType: FieldsV1
          fieldsV1:
            f:status:
              f:conditions:
                .: {}
                k:{"type":"AbleToScale"}:
                  .: {}
                  f:lastTransitionTime: {}
                  f:message: {}
                  f:reason: {}
                  f:status: {}
                  f:type: {}
                k:{"type":"ScalingActive"}:
                  .: {}
                  f:lastTransitionTime: {}
                  f:message: {}
                  f:reason: {}
                  f:status: {}
                  f:type: {}
                k:{"type":"ScalingLimited"}:
                  .: {}
                  f:lastTransitionTime: {}
                  f:message: {}
                  f:reason: {}
                  f:status: {}
                  f:type: {}
              f:currentMetrics: {}
              f:currentReplicas: {}
              f:desiredReplicas: {}
          manager: kube-controller-manager
          operation: Update
          subresource: status
          time: "2026-04-22T20:08:00Z"
      name: isvc-raw-sklearn-batcher-ccfea-predictor
      namespace: kserve-ci-e2e-test
      ownerReferences:
        - apiVersion: serving.kserve.io/v1beta1
          blockOwnerDeletion: true
          controller: true
          kind: InferenceService
          name: isvc-raw-sklearn-batcher-ccfea
          uid: 625f01ea-5558-4b8b-ad2b-9a2fb95a8d7f
      # Quoted so the all-digit value is kept as a string, not an integer.
      resourceVersion: "48046"
      uid: 5fccaec4-4554-49e6-9ea0-83b2a5a2fd24
    spec:
      behavior:
        scaleDown:
          policies:
            - periodSeconds: 15
              type: Percent
              value: 100
          selectPolicy: Max
        scaleUp:
          policies:
            - periodSeconds: 15
              type: Pods
              value: 4
            - periodSeconds: 15
              type: Percent
              value: 100
          selectPolicy: Max
          stabilizationWindowSeconds: 0
      # minReplicas and maxReplicas are both 1, so the replica count is
      # pinned at one regardless of the CPU metric below.
      maxReplicas: 1
      metrics:
        - resource:
            name: cpu
            target:
              averageUtilization: 80
              type: Utilization
          type: Resource
      minReplicas: 1
      scaleTargetRef:
        apiVersion: apps/v1
        kind: Deployment
        name: isvc-raw-sklearn-batcher-ccfea-predictor
    status:
      # Condition status is the string "True"/"False", not a YAML boolean;
      # the quotes are required.
      conditions:
        - lastTransitionTime: "2026-04-22T18:44:54Z"
          message: recommended size matches current size
          reason: ReadyForNewScale
          status: "True"
          type: AbleToScale
        - lastTransitionTime: "2026-04-22T18:46:54Z"
          # Folded scalar: parses to the same single-line message.
          message: >-
            the HPA was able to successfully calculate a replica count
            from cpu resource utilization (percentage of request)
          reason: ValidMetricFound
          status: "True"
          type: ScalingActive
        - lastTransitionTime: "2026-04-22T18:46:54Z"
          message: the desired count is within the acceptable range
          reason: DesiredWithinRange
          status: "False"
          type: ScalingLimited
      currentMetrics:
        - resource:
            current:
              averageUtilization: 12
              averageValue: 18m
            name: cpu
          type: Resource
      currentReplicas: 1
      desiredReplicas: 1
kind: HorizontalPodAutoscalerList
metadata:
  resourceVersion: "48100"