ray/examples/hyperopt/driver.py

# Most of the TensorFlow code is adapted from TensorFlow's tutorial on training a CNN on MNIST:
# https://www.tensorflow.org/versions/r0.9/tutorials/mnist/pros/index.html#build-a-multilayer-convolutional-network
import numpy as np
import ray
import os

import tensorflow as tf
from tensorflow.examples.tutorials.mnist import input_data

import hyperopt

if __name__ == "__main__":
  # Driver for a random hyperparameter search: sample `trials` random
  # hyperparameter sets, launch one remote training task per set, then fetch
  # each accuracy and report the best performing set.
  ray.init(start_ray_local=True, num_workers=3)

  # The number of sets of random hyperparameters to try.
  trials = 2
  # The number of training passes over the dataset to use for network.
  epochs = 10

  # Load the mnist data and turn the data into remote objects. The same
  # handles are passed to every task launched below.
  print("Downloading the MNIST dataset. This may take a minute.")
  mnist = input_data.read_data_sets("MNIST_data", one_hot=True)
  train_images = ray.put(mnist.train.images)
  train_labels = ray.put(mnist.train.labels)
  validation_images = ray.put(mnist.validation.images)
  validation_labels = ray.put(mnist.validation.labels)

  # Store the best parameters, the best accuracy, and all of the results.
  # `best_params` stays None until some trial beats an accuracy of 0.
  best_params = None
  best_accuracy = 0
  results = []

  # Randomly generate some hyperparameters, and launch a task for each set.
  # All tasks are submitted before any result is fetched.
  for _ in range(trials):
    # learning_rate and stddev are sampled log-uniformly over [1e-5, 1e5).
    learning_rate = 10 ** np.random.uniform(-5, 5)
    batch_size = np.random.randint(1, 100)
    dropout = np.random.uniform(0, 1)
    stddev = 10 ** np.random.uniform(-5, 5)
    params = {"learning_rate": learning_rate, "batch_size": batch_size, "dropout": dropout, "stddev": stddev}
    # Keep the parameters next to the ID of the pending result so the two can
    # be reported together later.
    result_id = hyperopt.train_cnn_and_compute_accuracy.remote(params, epochs, train_images, train_labels, validation_images, validation_labels)
    results.append((params, result_id))

  # Fetch the results of the tasks and print the results.
  for params, result_id in results:
    accuracy = ray.get(result_id)
    print("""We achieve accuracy {:.3}% with
        learning_rate: {:.2}
        batch_size: {}
        dropout: {:.2}
        stddev: {:.2}
      """.format(100 * accuracy, params["learning_rate"], params["batch_size"], params["dropout"], params["stddev"]))
    if accuracy > best_accuracy:
      best_params = params
      best_accuracy = accuracy

  # Record the best performing set of hyperparameters.
  if best_params is None:
    # Either no trials were run or no trial scored above 0; indexing
    # best_params would raise a TypeError, so report the situation instead.
    print("None of the {} trials achieved an accuracy above 0; there is no best set of hyperparameters to report.".format(trials))
  else:
    print("""Best accuracy over {} trials was {:.3}% with
        learning_rate: {:.2}
        batch_size: {}
        dropout: {:.2}
        stddev: {:.2}
    """.format(trials, 100 * best_accuracy, best_params["learning_rate"], best_params["batch_size"], best_params["dropout"], best_params["stddev"]))
update hyperparameter optimization app (#299) 2016-07-26 18:16:10 -07:00			`# Most of the tensorflow code is adapted from Tensorflow's tutorial on using CNNs to train MNIST`
			`# https://www.tensorflow.org/versions/r0.9/tutorials/mnist/pros/index.html#build-a-multilayer-convolutional-network`
Hyperparameter Optimization Code 2016-06-25 00:13:47 +00:00			`import numpy as np`
			`import ray`
			`import os`

update hyperparameter optimization app (#299) 2016-07-26 18:16:10 -07:00			`import tensorflow as tf`
			`from tensorflow.examples.tutorials.mnist import input_data`

			`import hyperopt`

			`if __name__ == "__main__":`
unify starting local cluster with attaching to existing cluster (#327) 2016-07-31 19:26:35 -07:00			`ray.init(start_ray_local=True, num_workers=3)`
update hyperparameter optimization app (#299) 2016-07-26 18:16:10 -07:00
			`# The number of sets of random hyperparameters to try.`
			`trials = 2`
			`# The number of training passes over the dataset to use for network.`
			`epochs = 10`

			`# Load the mnist data and turn the data into remote objects.`
			`print "Downloading the MNIST dataset. This may take a minute."`
			`mnist = input_data.read_data_sets("MNIST_data", one_hot=True)`
			`train_images = ray.put(mnist.train.images)`
			`train_labels = ray.put(mnist.train.labels)`
			`validation_images = ray.put(mnist.validation.images)`
			`validation_labels = ray.put(mnist.validation.labels)`

			`# Store the best parameters, the best accuracy, and all of the results.`
			`best_params = None`
			`best_accuracy = 0`
			`results = []`

			`# Randomly generate some hyperparameters, and launch a task for each set.`
			`for i in range(trials):`
			`learning_rate = 10 ** np.random.uniform(-5, 5)`
			`batch_size = np.random.randint(1, 100)`
			`dropout = np.random.uniform(0, 1)`
			`stddev = 10 ** np.random.uniform(-5, 5)`
			`params = {"learning_rate": learning_rate, "batch_size": batch_size, "dropout": dropout, "stddev": stddev}`
change remote function invocation from func() to func.remote() (#328) 2016-07-31 15:25:19 -07:00			`results.append((params, hyperopt.train_cnn_and_compute_accuracy.remote(params, epochs, train_images, train_labels, validation_images, validation_labels)))`
update hyperparameter optimization app (#299) 2016-07-26 18:16:10 -07:00
			`# Fetch the results of the tasks and print the results.`
			`for i in range(trials):`
Terminology change Object Reference -> Object ID (#330) 2016-07-31 19:58:03 -07:00			`params, result_id = results[i]`
			`accuracy = ray.get(result_id)`
update hyperparameter optimization app (#299) 2016-07-26 18:16:10 -07:00			`print """We achieve accuracy {:.3}% with`
			`learning_rate: {:.2}`
			`batch_size: {}`
			`dropout: {:.2}`
			`stddev: {:.2}`
			`""".format(100 * accuracy, params["learning_rate"], params["batch_size"], params["dropout"], params["stddev"])`
			`if accuracy > best_accuracy:`
			`best_params = params`
			`best_accuracy = accuracy`

			`# Record the best performing set of hyperparameters.`
			`print """Best accuracy over {} trials was {:.3} with`
			`learning_rate: {:.2}`
			`batch_size: {}`
			`dropout: {:.2}`
			`stddev: {:.2}`
			`""".format(trials, 100 * best_accuracy, best_params["learning_rate"], best_params["batch_size"], best_params["dropout"], best_params["stddev"])`