# Mirror of https://github.com/vale981/ray
# Synced 2025-03-06 10:31:39 -05:00
# 101 lines, 2 KiB, YAML
# Serve-team test entry that runs
# workloads/single_deployment_1k_noop_replica.py on the 32-CPU compute template.
# NOTE(review): nesting was rebuilt from a flattened copy of this file; confirm
# that `smoke_test` is a sibling of `run` rather than nested inside it.
- name: single_deployment_1k_noop_replica
  team: serve
  cluster:
    app_config: app_config.yaml
    compute_template: compute_tpl_32_cpu.yaml

  run:
    timeout: 7200
    long_running: false
    script: python workloads/single_deployment_1k_noop_replica.py

  # Smoke-test settings list a shorter timeout than the full run.
  smoke_test:
    timeout: 600

# Serve-team test entry that runs
# workloads/multi_deployment_1k_noop_replica.py on the 32-CPU compute template.
# NOTE(review): nesting was rebuilt from a flattened copy of this file; confirm
# that `smoke_test` is a sibling of `run` rather than nested inside it.
- name: multi_deployment_1k_noop_replica
  team: serve
  cluster:
    app_config: app_config.yaml
    compute_template: compute_tpl_32_cpu.yaml

  run:
    timeout: 7200
    long_running: false
    script: python workloads/multi_deployment_1k_noop_replica.py

  # Smoke-test settings list a shorter timeout than the full run.
  smoke_test:
    timeout: 600

# Serve-team test entry that runs workloads/autoscaling_single_deployment.py
# using the 8-CPU autoscaling compute template.
# NOTE(review): nesting was rebuilt from a flattened copy of this file; confirm
# that `smoke_test` is a sibling of `run` rather than nested inside it.
- name: autoscaling_single_deployment
  team: serve
  cluster:
    app_config: app_config.yaml
    compute_template: compute_tpl_8_cpu_autoscaling.yaml

  run:
    timeout: 7200
    long_running: false
    script: python workloads/autoscaling_single_deployment.py

  # Smoke-test settings list a shorter timeout than the full run.
  smoke_test:
    timeout: 600

# Serve-team test entry that runs workloads/autoscaling_multi_deployment.py
# using the 8-CPU autoscaling compute template.
# NOTE(review): nesting was rebuilt from a flattened copy of this file; confirm
# that `smoke_test` is a sibling of `run` rather than nested inside it.
- name: autoscaling_multi_deployment
  team: serve
  cluster:
    app_config: app_config.yaml
    compute_template: compute_tpl_8_cpu_autoscaling.yaml

  run:
    timeout: 7200
    long_running: false
    script: python workloads/autoscaling_multi_deployment.py

  # Smoke-test settings list a shorter timeout than the full run.
  smoke_test:
    timeout: 600

# Serve-team test entry that runs workloads/serve_micro_benchmark.py on the
# single-node compute template.
# NOTE(review): nesting was rebuilt from a flattened copy of this file; confirm
# that `smoke_test` is a sibling of `run` rather than nested inside it.
- name: serve_micro_benchmark
  team: serve
  cluster:
    app_config: app_config.yaml
    # 16 CPUs
    compute_template: compute_tpl_single_node.yaml

  run:
    timeout: 7200
    long_running: false
    script: python workloads/serve_micro_benchmark.py

  # Smoke-test settings list a shorter timeout than the full run.
  smoke_test:
    timeout: 600

# Serve-team test entry that runs the same workloads/serve_micro_benchmark.py
# script with the k8s single-node compute template and `compute_on_k8s` enabled.
# NOTE(review): nesting was rebuilt from a flattened copy of this file; confirm
# that `compute_on_k8s` belongs under `cluster` and that `smoke_test` is a
# sibling of `run` rather than nested inside it.
- name: serve_micro_benchmark_k8s
  team: serve
  cluster:
    app_config: app_config.yaml
    # 16 CPUs
    compute_template: compute_tpl_single_node_k8s.yaml
    compute_on_k8s: true

  run:
    timeout: 7200
    long_running: false
    script: python workloads/serve_micro_benchmark.py

  # Smoke-test settings list a shorter timeout than the full run.
  smoke_test:
    timeout: 600

# Serve-team test entry that runs workloads/serve_cluster_fault_tolerance.py on
# the single-node compute template.
# NOTE(review): nesting was rebuilt from a flattened copy of this file; confirm
# that `smoke_test` is a sibling of `run` rather than nested inside it.
- name: serve_cluster_fault_tolerance
  team: serve
  cluster:
    app_config: app_config.yaml
    # 16 CPUs
    compute_template: compute_tpl_single_node.yaml

  run:
    timeout: 7200
    long_running: false
    script: python workloads/serve_cluster_fault_tolerance.py

  # Smoke-test settings list a shorter timeout than the full run.
  smoke_test:
    timeout: 600