mirror of
https://github.com/vale981/ray
synced 2025-03-06 02:21:39 -05:00

* Add base for Soft Actor-Critic * Pick changes from old SAC branch * Update sac.py * First implementation of sac model * Remove unnecessary SAC imports * Prune unnecessary noise and exploration code * Implement SAC model and use that in SAC policy * runs but doesn't learn * clear state * fix batch size * Add missing alpha grads and vars * -200 by 2k timesteps * doc * lazy squash * one file * ignore tfp * revert done
18 lines
811 B
Docker
18 lines
811 B
Docker
# The examples Docker image adds dependencies needed to run the examples
|
|
|
|
# Base image that the examples image extends. BASE_IMAGE defaults to the
# original untagged reference (which Docker resolves to :latest); pass
# --build-arg BASE_IMAGE=<image>:<tag> to build on a pinned base instead.
ARG BASE_IMAGE=ray-project/deploy
FROM ${BASE_IMAGE}
|
|
|
|
# This updates numpy (unpinned; 1.14 at the time of writing) and mutes errors from other libraries
|
|
RUN conda install --yes numpy
|
|
# Refresh the package index in the same layer as the install so this step does
# not depend on whatever index the base image happens to ship, then remove the
# index files so they do not persist in the image.
RUN apt-get update \
    && apt-get install -y --no-install-recommends zlib1g-dev \
    && rm -rf /var/lib/apt/lists/*
|
|
# The following is needed to support TensorFlow 1.14
|
|
# --force removes wrapt on its own, without also removing packages that depend on it.
RUN conda remove --yes --force wrapt
|
|
# Python packages needed by the examples. "gym[atari]" is quoted because square
# brackets are glob characters to the shell; --no-cache-dir keeps pip's
# download cache out of the image layer. One package per line, sorted.
RUN pip install --no-cache-dir \
        "gym[atari]" \
        keras \
        lz4 \
        opencv-python-headless \
        pytest-timeout \
        smart_open \
        tensorflow \
        tensorflow_probability
|
|
# Upgrading h5py mutes FutureWarnings.
RUN pip install --upgrade h5py
|
|
# Install bayesian-optimization, upgrading it if an older copy is already present.
RUN pip install -U bayesian-optimization
|
|
# Install hyperopt straight from its GitHub repository (default branch).
# Fetched over HTTPS: GitHub no longer serves the unauthenticated git://
# protocol, so the former git+git:// URL cannot be cloned.
RUN pip install --upgrade git+https://github.com/hyperopt/hyperopt.git
|
|
# Install sigopt, upgrading any copy that is already installed.
RUN pip install -U sigopt
|
|
# Install nevergrad, upgrading any copy that is already installed.
RUN pip install -U nevergrad
|
|
# Install scikit-optimize, upgrading any copy that is already installed.
RUN pip install -U scikit-optimize
|
|
# The requirement is quoted so the shell passes ">=0.3.1" to pip as part of the
# specifier. Unquoted, ">" is an output redirection: pip would receive only
# "pytest-remotedata" and its output would land in a file named "=0.3.1".
RUN pip install -U "pytest-remotedata>=0.3.1"
|
|
# Install the CPU builds of PyTorch and torchvision from the pytorch channel.
# -y answers conda's confirmation prompt, which nobody can answer during a
# non-interactive image build; this matches the other conda steps in this file.
RUN conda install -y -c pytorch pytorch-cpu torchvision-cpu
|