ray/release/nightly_tests/dataset/dataset_test.yaml
Chen Shen 6d17fe5fc5
[cuj2] merge latest change to cuj2 (groupby based filtering) and add a debug mode. (#20742)
This PR does two things:

merge latest groupby based filtering to CUJ2
add a debug mode so we only run a dummy trainer to measure data-processing performance.
2021-11-29 19:10:17 -08:00

96 lines
2.3 KiB
YAML

# Test "inference": runs wait_cluster.py as the prepare step, then inference.py.
- name: inference
  owner:
    mail: "core@anyscale.com"
    slack: "@Alex Wu"

  cluster:
    app_config: app_config.yaml
    compute_template: inference.yaml

  run:
    # presumably seconds — confirm against the release-test runner
    timeout: 600
    # NOTE(review): arguments look like <node count> <wait timeout>; verify in
    # wait_cluster.py
    prepare: python wait_cluster.py 2 600
    script: python inference.py
# Test "shuffle_data_loader": runs dataset_shuffle_data_loader.py directly;
# no prepare step is configured for this entry.
- name: shuffle_data_loader
  owner:
    mail: "core@anyscale.com"
    slack: "@Chen Shen"

  cluster:
    app_config: shuffle_app_config.yaml
    compute_template: shuffle_compute.yaml

  run:
    # presumably seconds — confirm against the release-test runner
    timeout: 1800
    script: python dataset_shuffle_data_loader.py
# Test "pipelined_training_50_gb": runs pipelined_training.py for one epoch
# after the wait_cluster.py prepare step.
- name: pipelined_training_50_gb
  owner:
    mail: "core@anyscale.com"
    slack: "@Chen Shen"

  cluster:
    app_config: pipelined_training_app.yaml
    compute_template: pipelined_training_compute.yaml

  run:
    # presumably seconds — confirm against the release-test runner
    timeout: 4800
    # NOTE(review): arguments look like <node count> <wait timeout>; verify in
    # wait_cluster.py
    prepare: python wait_cluster.py 15 1200
    script: python pipelined_training.py --epochs 1
# Test "pipelined_ingestion_1500_gb_15_windows": runs pipelined_training.py
# with --debug, two epochs, 15 windows and 915 files.
- name: pipelined_ingestion_1500_gb_15_windows
  owner:
    mail: "core@anyscale.com"
    slack: "@Chen Shen"

  cluster:
    app_config: pipelined_ingestion_app.yaml
    compute_template: pipelined_ingestion_compute.yaml

  run:
    # presumably seconds — confirm against the release-test runner
    timeout: 4800
    # NOTE(review): arguments look like <node count> <wait timeout>; verify in
    # wait_cluster.py
    prepare: python wait_cluster.py 21 2400
    script: python pipelined_training.py --epochs 2 --num-windows 15 --num-files 915 --debug
# Test "datasets_ingest_train_infer": runs ray_sgd_training.py with 16 GPU
# workers, S3 input and --large-dataset. The smoke_test section supplies an
# alternative cluster/run configuration (8 workers, no --large-dataset).
- name: datasets_ingest_train_infer
  owner:
    mail: "core@anyscale.com"
    slack: "@Chen Shen"

  cluster:
    app_config: ray_sgd_training_app.yaml
    compute_template: ray_sgd_training_compute.yaml

  run:
    # presumably seconds — confirm against the release-test runner
    timeout: 14400
    # NOTE(review): arguments look like <node count> <wait timeout>; verify in
    # wait_cluster.py
    prepare: python wait_cluster.py 66 2400
    script: python ray_sgd_training.py --address auto --use-s3 --num-workers 16 --use-gpu --large-dataset

  # NOTE(review): placed at test-entry level; confirm the runner does not
  # expect `stable` nested under `run`.
  stable: false

  smoke_test:
    cluster:
      app_config: ray_sgd_training_app.yaml
      compute_template: ray_sgd_training_smoke_compute.yaml

    run:
      timeout: 3600
      prepare: python wait_cluster.py 8 2400
      script: python ray_sgd_training.py --address auto --use-s3 --num-workers 8 --use-gpu
# Test "datasets_preprocess_ingest": runs ray_sgd_training.py with 16 GPU
# workers, S3 input, --large-dataset and --debug.
- name: datasets_preprocess_ingest
  owner:
    mail: "core@anyscale.com"
    slack: "@Chen Shen"

  cluster:
    app_config: ray_sgd_training_app.yaml
    compute_template: ray_sgd_training_compute.yaml

  run:
    # presumably seconds — confirm against the release-test runner
    timeout: 14400
    # NOTE(review): arguments look like <node count> <wait timeout>; verify in
    # wait_cluster.py
    prepare: python wait_cluster.py 66 2400
    script: python ray_sgd_training.py --address auto --use-s3 --num-workers 16 --use-gpu --large-dataset --debug

  # NOTE(review): placed at test-entry level; confirm the runner does not
  # expect `stable` nested under `run`.
  stable: false