mirror of
https://github.com/openshift/openshift-docs.git
synced 2026-02-05 21:46:22 +01:00
28 lines
1.2 KiB
Plaintext
28 lines
1.2 KiB
Plaintext
// Module included in the following assemblies:
|
|
//
|
|
// * serverless/develop/serverless-autoscaling-developer.adoc
|
|
|
|
:_content-type: REFERENCE
|
|
[id="serverless-target-utilization_{context}"]
|
|
= Concurrency target utilization
|
|
|
|
The concurrency target utilization value specifies the percentage of the concurrency limit that the autoscaler actually targets. This is also known as specifying the _hotness_ at which a replica runs. Setting it below 100 percent enables the autoscaler to scale up before the defined hard limit is reached.
|
|
|
|
For example, if the `containerConcurrency` value is set to 10, and the `target-utilization-percentage` value is set to 70, the autoscaler creates a new replica when the average number of concurrent requests across all existing replicas reaches 7, which is 70 percent of 10. Requests numbered 7 to 10 are still sent to the existing replicas, but additional replicas are started in anticipation of being required after the `containerConcurrency` value is reached.
|
|
|
|
.Example service configured using the `target-utilization-percentage` annotation
|
|
[source,yaml]
|
|
----
|
|
apiVersion: serving.knative.dev/v1
kind: Service
metadata:
  name: example-service
  namespace: default
spec:
  template:
    metadata:
      annotations:
        autoscaling.knative.dev/target-utilization-percentage: "70"
...
|
|
----
|