# ray/release/nightly_tests/dataset/dataset_test.yaml

# Test entry "inference": runs inference.py using the app_config.yaml /
# inference.yaml cluster configuration.
- name: inference
  owner:
    mail: 'core@anyscale.com'
    slack: '@Alex Wu'

  cluster:
    app_config: app_config.yaml
    compute_template: inference.yaml

  run:
    # NOTE(review): timeout unit is presumably seconds — confirm with the runner.
    timeout: 600
    # Presumably executed before `script`; the meaning of the arguments "2 600"
    # is defined by wait_cluster.py (likely node count and wait limit — TODO confirm).
    prepare: python wait_cluster.py 2 600
    script: python inference.py

# Test entry "shuffle_data_loader": runs dataset_shuffle_data_loader.py using
# the shuffle_app_config.yaml / shuffle_compute.yaml cluster configuration.
- name: shuffle_data_loader
  owner:
    mail: 'core@anyscale.com'
    slack: '@Chen Shen'

  cluster:
    app_config: shuffle_app_config.yaml
    compute_template: shuffle_compute.yaml

  run:
    # NOTE(review): timeout unit is presumably seconds — confirm with the runner.
    # No `prepare` command is configured for this entry.
    timeout: 1800
    script: python dataset_shuffle_data_loader.py

# Test entry "pipelined_training_50_gb": runs pipelined_training.py with
# --epochs 1 using the pipelined_training_* cluster configuration.
- name: pipelined_training_50_gb
  owner:
    mail: 'core@anyscale.com'
    slack: '@Chen Shen'

  cluster:
    app_config: pipelined_training_app.yaml
    compute_template: pipelined_training_compute.yaml

  run:
    # NOTE(review): timeout unit is presumably seconds — confirm with the runner.
    timeout: 4800
    # Presumably executed before `script`; the meaning of "15 1200" is defined
    # by wait_cluster.py (likely node count and wait limit — TODO confirm).
    prepare: python wait_cluster.py 15 1200
    script: python pipelined_training.py --epochs 1

# Test entry "pipelined_ingestion_1500_gb_15_windows": runs
# pipelined_training.py with 2 epochs, 15 windows, 915 files and --debug,
# using the pipelined_ingestion_* cluster configuration.
- name: pipelined_ingestion_1500_gb_15_windows
  owner:
    mail: 'core@anyscale.com'
    slack: '@Chen Shen'

  cluster:
    app_config: pipelined_ingestion_app.yaml
    compute_template: pipelined_ingestion_compute.yaml

  run:
    # NOTE(review): timeout unit is presumably seconds — confirm with the runner.
    timeout: 4800
    # Presumably executed before `script`; the meaning of "21 2400" is defined
    # by wait_cluster.py (likely node count and wait limit — TODO confirm).
    prepare: python wait_cluster.py 21 2400
    # NOTE(review): the command has a double space before --num-files; it is
    # kept exactly as written.
    script: python pipelined_training.py --epochs 2 --num-windows 15  --num-files 915 --debug

# Test entry "datasets_ingest_train_infer": runs ray_sgd_training.py with
# --large-dataset on 16 workers; a smaller `smoke_test` variant is nested below.
- name: datasets_ingest_train_infer
  owner:
    mail: 'core@anyscale.com'
    slack: '@Chen Shen'

  cluster:
    app_config: ray_sgd_training_app.yaml
    compute_template: ray_sgd_training_compute.yaml

  run:
    # NOTE(review): timeout unit is presumably seconds — confirm with the runner.
    timeout: 14400
    # Presumably executed before `script`; the meaning of "66 2400" is defined
    # by wait_cluster.py (likely node count and wait limit — TODO confirm).
    prepare: python wait_cluster.py 66 2400
    # Folded scalar: the lines below are joined with single spaces into one
    # command string with no trailing newline.
    script: >-
      python ray_sgd_training.py --address auto --use-s3
      --num-workers 16 --use-gpu --large-dataset

  # NOTE(review): presumably flags this test as not yet stable — confirm how
  # the release tooling interprets this key.
  stable: false

  # Variant with its own cluster and run settings: a different compute
  # template, a shorter timeout, 8 workers and no --large-dataset flag.
  smoke_test:
    cluster:
      app_config: ray_sgd_training_app.yaml
      compute_template: ray_sgd_training_smoke_compute.yaml

    run:
      timeout: 3600
      prepare: python wait_cluster.py 8 2400
      # Folded scalar: joined into a single-line command, no trailing newline.
      script: >-
        python ray_sgd_training.py --address auto --use-s3
        --num-workers 8 --use-gpu

# Test entry "datasets_preprocess_ingest": runs ray_sgd_training.py with
# --large-dataset and --debug on 16 workers, using the ray_sgd_training_*
# cluster configuration.
- name: datasets_preprocess_ingest
  owner:
    mail: 'core@anyscale.com'
    slack: '@Chen Shen'

  cluster:
    app_config: ray_sgd_training_app.yaml
    compute_template: ray_sgd_training_compute.yaml

  run:
    # NOTE(review): timeout unit is presumably seconds — confirm with the runner.
    timeout: 14400
    # Presumably executed before `script`; the meaning of "66 2400" is defined
    # by wait_cluster.py (likely node count and wait limit — TODO confirm).
    prepare: python wait_cluster.py 66 2400
    # Folded scalar: the lines below are joined with single spaces into one
    # command string with no trailing newline.
    script: >-
      python ray_sgd_training.py --address auto --use-s3
      --num-workers 16 --use-gpu --large-dataset --debug

  # NOTE(review): presumably flags this test as not yet stable — confirm how
  # the release tooling interprets this key.
  stable: false