forked from llm-d/llm-d-workload-variant-autoscaler
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathhpa.yaml
More file actions
36 lines (36 loc) · 801 Bytes
/
hpa.yaml
File metadata and controls
36 lines (36 loc) · 801 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
---
# HorizontalPodAutoscaler for the `sample-deployment` Deployment in the
# `llm-d-sim` namespace. Scaling is driven by a single external metric,
# `wva_desired_replicas`, filtered to the series labelled
# `variant_name: sample-deployment`.
apiVersion: autoscaling/v2
kind: HorizontalPodAutoscaler
metadata:
  name: sample-deployment-hpa
  namespace: llm-d-sim
spec:
  # Workload whose replica count this HPA manages.
  scaleTargetRef:
    apiVersion: apps/v1
    kind: Deployment
    name: sample-deployment
  # minReplicas: 0  # scale to zero - alpha feature
  # With minReplicas left commented out, the Kubernetes API default applies.
  maxReplicas: 2
  behavior:
    # No stabilization window in either direction: the HPA acts on the
    # current recommendation instead of smoothing over past ones.
    scaleUp:
      stabilizationWindowSeconds: 0
      policies:
        # Allow adding at most 10 pods per 15-second period.
        - type: Pods
          value: 10
          periodSeconds: 15
    scaleDown:
      stabilizationWindowSeconds: 0
      policies:
        # Allow removing at most 10 pods per 15-second period.
        - type: Pods
          value: 10
          periodSeconds: 15
  metrics:
    - type: External
      external:
        metric:
          name: wva_desired_replicas
          selector:
            matchLabels:
              variant_name: sample-deployment
        target:
          # AverageValue divides the metric by the current replica count and
          # compares it to the target. With a target of "1", the replica
          # count is presumably meant to track the metric's value directly;
          # confirm against the metric producer.
          type: AverageValue
          averageValue: "1"