Add a Knative Service manifest (sleep-py-sc, namespace default) that uses
concurrency-based autoscaling: KPA autoscaler class, a target of 10 in-flight
requests per pod, at least 1 pod (no scale to zero) and at most 100 pods.

NOTE(review): the manifest targets serving.knative.dev/v1alpha1 and an untagged
container image; confirm the cluster still serves that API version and consider
pinning the image tag before applying.

diff --git a/functions/scaling/sleep-py-concurrency.yml b/functions/scaling/sleep-py-concurrency.yml
new file mode 100644
index 0000000..0becd88
--- /dev/null
+++ b/functions/scaling/sleep-py-concurrency.yml
@@ -0,0 +1,21 @@
+apiVersion: serving.knative.dev/v1alpha1
+kind: Service
+metadata:
+  name: sleep-py-sc
+  namespace: default
+spec:
+  template:
+    metadata:
+      annotations:
+        # Knative concurrency-based autoscaling (default).
+        autoscaling.knative.dev/class: kpa.autoscaling.knative.dev
+        autoscaling.knative.dev/metric: concurrency
+        # Target 10 requests in-flight per pod.
+        autoscaling.knative.dev/target: "10"
+        # Disable scale to zero with a minScale of 1.
+        autoscaling.knative.dev/minScale: "1"
+        # Limit scaling to 100 pods.
+        autoscaling.knative.dev/maxScale: "100"
+    spec:
+      containers:
+        - image: tormachris/sleep-python