mirror of
https://github.com/vale981/ray
synced 2025-03-12 06:06:39 -04:00

We fixed the groupby issue in cuj2; this syncs the change into the nightly test. This test does not need a GPU at all: it returns soon after data ingestion finishes.
96 lines
2.3 KiB
YAML
96 lines
2.3 KiB
YAML
# Test entry "inference": runs the `prepare` command first, then `inference.py`.
- name: inference
  # Contact details for this test.
  owner:
    mail: "core@anyscale.com"
    slack: "@Alex Wu"

  # Cluster configuration files used by this test.
  cluster:
    app_config: app_config.yaml
    compute_template: inference.yaml

  run:
    # NOTE(review): presumably seconds -- confirm against the test runner.
    timeout: 600
    # NOTE(review): arguments look like <node count> <wait timeout>; verify in wait_cluster.py.
    prepare: python wait_cluster.py 2 600
    script: python inference.py
# Test entry "shuffle_data_loader": runs dataset_shuffle_data_loader.py.
# No `prepare` command is configured for this entry.
- name: shuffle_data_loader
  # Contact details for this test.
  owner:
    mail: "core@anyscale.com"
    slack: "@Chen Shen"

  # Cluster configuration files used by this test.
  cluster:
    app_config: shuffle_app_config.yaml
    compute_template: shuffle_compute.yaml

  run:
    # NOTE(review): presumably seconds -- confirm against the test runner.
    timeout: 1800
    script: python dataset_shuffle_data_loader.py
# Test entry "pipelined_training_50_gb": runs pipelined_training.py for one epoch.
- name: pipelined_training_50_gb
  # Contact details for this test.
  owner:
    mail: "core@anyscale.com"
    slack: "@Chen Shen"

  # Cluster configuration files used by this test.
  cluster:
    app_config: pipelined_training_app.yaml
    compute_template: pipelined_training_compute.yaml

  run:
    # NOTE(review): presumably seconds -- confirm against the test runner.
    timeout: 4800
    # NOTE(review): arguments look like <node count> <wait timeout>; verify in wait_cluster.py.
    prepare: python wait_cluster.py 15 1200
    script: python pipelined_training.py --epochs 1
# Test entry "pipelined_ingestion_1500_gb_15_windows": runs pipelined_training.py
# in --debug mode with 2 epochs, 15 windows and 915 files.
- name: pipelined_ingestion_1500_gb_15_windows
  # Contact details for this test.
  owner:
    mail: "core@anyscale.com"
    slack: "@Chen Shen"

  # Cluster configuration files used by this test.
  cluster:
    app_config: pipelined_ingestion_app.yaml
    compute_template: pipelined_ingestion_compute.yaml

  run:
    # NOTE(review): presumably seconds -- confirm against the test runner.
    timeout: 4800
    # NOTE(review): arguments look like <node count> <wait timeout>; verify in wait_cluster.py.
    prepare: python wait_cluster.py 21 2400
    # --num-windows 15 matches the "15_windows" suffix of the test name.
    script: python pipelined_training.py --epochs 2 --num-windows 15 --num-files 915 --debug
# Test entry "datasets_ingest_train_infer": runs ray_sgd_training.py with
# --use-gpu, --use-s3 and --large-dataset on 16 workers; a smaller smoke-test
# variant is configured under `smoke_test`.
# NOTE(review): nesting was reconstructed from a flattened source -- confirm that
# `stable` and `smoke_test` are entry-level keys (siblings of `run`).
- name: datasets_ingest_train_infer
  # Contact details for this test.
  owner:
    mail: "core@anyscale.com"
    slack: "@Chen Shen"

  # Cluster configuration files used by the full run.
  cluster:
    app_config: ray_sgd_training_app.yaml
    compute_template: ray_sgd_training_compute.yaml

  run:
    # NOTE(review): presumably seconds -- confirm against the test runner.
    timeout: 14400
    # NOTE(review): arguments look like <node count> <wait timeout>; verify in wait_cluster.py.
    prepare: python wait_cluster.py 66 2400
    script: python ray_sgd_training.py --address auto --use-s3 --num-workers 16 --use-gpu --large-dataset

  stable: false

  # Smoke-test variant: same app config, a separate compute template, 8 workers
  # and no --large-dataset flag.
  smoke_test:
    cluster:
      app_config: ray_sgd_training_app.yaml
      compute_template: ray_sgd_training_smoke_compute.yaml

    run:
      timeout: 3600
      prepare: python wait_cluster.py 8 2400
      script: python ray_sgd_training.py --address auto --use-s3 --num-workers 8 --use-gpu
# Test entry "datasets_preprocess_ingest": runs ray_sgd_training.py in --debug
# mode with --large-dataset on 16 workers, using the "no_gpu" compute template.
# NOTE(review): nesting was reconstructed from a flattened source -- confirm that
# `stable` is an entry-level key (sibling of `run`).
- name: datasets_preprocess_ingest
  # Contact details for this test.
  owner:
    mail: "core@anyscale.com"
    slack: "@Chen Shen"

  # Cluster configuration files used by this test.
  cluster:
    app_config: ray_sgd_training_app.yaml
    compute_template: ray_sgd_training_compute_no_gpu.yaml

  run:
    # NOTE(review): presumably seconds -- confirm against the test runner.
    timeout: 7200
    # NOTE(review): arguments look like <node count> <wait timeout>; verify in wait_cluster.py.
    prepare: python wait_cluster.py 21 2400
    # NOTE(review): --use-gpu is still passed although the compute template is
    # named "..._no_gpu"; confirm the script tolerates this in --debug mode or
    # drop the flag.
    script: python ray_sgd_training.py --address auto --use-s3 --num-workers 16 --use-gpu --large-dataset --debug

  stable: false