[rllib] replace the assertion in SyncReplayOptimizer by a warning (#4534)

This commit is contained in:
Jones Wong 2019-04-02 01:43:22 -07:00 committed by Eric Liang
parent 60b230b8ad
commit fe7763e786

View file

@@ -2,6 +2,7 @@ from __future__ import absolute_import
from __future__ import division
from __future__ import print_function
+import logging
import collections
import numpy as np
@@ -17,6 +18,8 @@ from ray.rllib.utils.compression import pack_if_needed
from ray.rllib.utils.timer import TimerStat
from ray.rllib.utils.schedules import LinearSchedule
+logger = logging.getLogger(__name__)
class SyncReplayOptimizer(PolicyOptimizer):
"""Variant of the local sync optimizer that supports replay (for DQN).
@@ -69,7 +72,9 @@ class SyncReplayOptimizer(PolicyOptimizer):
self.replay_buffers = collections.defaultdict(new_buffer)
-assert buffer_size >= self.replay_starts
+if buffer_size < self.replay_starts:
+logger.warning("buffer_size={} < replay_starts={}".format(
+buffer_size, self.replay_starts))
@override(PolicyOptimizer)
def step(self):