2019-02-13 16:25:05 -08:00
|
|
|
import logging
|
|
|
|
import random
|
|
|
|
|
|
|
|
from ray.rllib.offline.input_reader import InputReader
|
|
|
|
from ray.rllib.utils.annotations import override, DeveloperAPI
|
2020-08-15 13:24:22 +02:00
|
|
|
from ray.rllib.utils.typing import SampleBatchType
|
2019-02-13 16:25:05 -08:00
|
|
|
|
|
|
|
# Module-level logger, named after this module.
logger = logging.getLogger(__name__)
|
|
|
|
|
|
|
|
|
|
|
|
@DeveloperAPI
class ShuffledInput(InputReader):
    """Input reader that serves batches out of a randomized window.

    Wraps another input reader and holds up to ``n`` of its batches in an
    in-memory buffer. This adds randomness to the data stream, which helps
    when the underlying batches were not in random order to start with.

    Batches are drawn from the buffer with replacement: a given batch may be
    returned more than once, or be overwritten before it is ever returned.
    """

    @DeveloperAPI
    def __init__(self, child: InputReader, n: int = 0):
        """Initializes a ShuffledInput instance.

        Args:
            child: The input reader whose batches are shuffled.
            n: Number of batches to keep in the shuffle buffer. With a
                value of 1 or less no shuffling takes place and `next()`
                forwards directly to `child`.
        """
        self.child = child
        self.n = n
        # Starts empty; filled on the first `next()` call that shuffles.
        self.buffer = []

    @override(InputReader)
    def next(self) -> SampleBatchType:
        """Returns the next (possibly shuffled) batch.

        Returns:
            The batch read from `child` when `n <= 1`; otherwise a randomly
            chosen entry of the shuffle buffer.
        """
        # Shuffling disabled: act as a plain pass-through.
        if self.n <= 1:
            return self.child.next()

        window = self.buffer

        # Top the buffer up to `n` batches before sampling from it.
        if len(window) < self.n:
            fill_msg = "Filling shuffle buffer to {} batches".format(self.n)
            logger.info(fill_msg)
            while len(window) < self.n:
                fresh_batch = self.child.next()
                window.append(fresh_batch)
            logger.info("Shuffle buffer filled")

        # Overwrite one random slot with a new batch, then hand out a
        # random entry (which may or may not be the one just inserted).
        slot = random.randrange(len(window))
        window[slot] = self.child.next()
        return random.choice(window)
|