ray/rllib/execution/replay_ops.py

36 lines
1.2 KiB
Python

from typing import Optional
import random
from ray.rllib.utils.replay_buffers.replay_buffer import warn_replay_capacity
from ray.rllib.utils.typing import SampleBatchType
# TODO(ekl) deprecate this in favor of the replay_sequence_length option.
class SimpleReplayBuffer:
"""Simple replay buffer that operates over batches."""
def __init__(self, num_slots: int, replay_proportion: Optional[float] = None):
"""Initialize SimpleReplayBuffer.
Args:
num_slots: Number of batches to store in total.
"""
self.num_slots = num_slots
self.replay_batches = []
self.replay_index = 0
def add_batch(self, sample_batch: SampleBatchType) -> None:
warn_replay_capacity(item=sample_batch, num_items=self.num_slots)
if self.num_slots > 0:
if len(self.replay_batches) < self.num_slots:
self.replay_batches.append(sample_batch)
else:
self.replay_batches[self.replay_index] = sample_batch
self.replay_index += 1
self.replay_index %= self.num_slots
def replay(self) -> SampleBatchType:
return random.choice(self.replay_batches)
def __len__(self):
return len(self.replay_batches)