ray/rllib/offline/json_reader.py


import glob
import json
import logging
import os
from pathlib import Path
import random
import re
from typing import List, Optional, Union
from urllib.parse import urlparse
import zipfile
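# `smart_open` is an optional dependency; it is only needed for reading input
# files from remote URIs such as s3:// (see `_try_open_file()` below).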
try:
from smart_open import smart_open
except ImportError:
smart_open = None
from ray.rllib.offline.input_reader import InputReader
from ray.rllib.offline.io_context import IOContext
from ray.rllib.policy.sample_batch import DEFAULT_POLICY_ID, MultiAgentBatch, \
SampleBatch
from ray.rllib.utils.annotations import override, PublicAPI
from ray.rllib.utils.compression import unpack_if_needed
from ray.rllib.utils.spaces.space_utils import clip_action, normalize_action
from ray.rllib.utils.typing import FileType, SampleBatchType
logger = logging.getLogger(__name__)
# On Windows, `urlparse()` reports a drive letter (e.g. the "c" in "c:\...") as
# the URL scheme, so drive letters must be accepted alongside the empty scheme.
WINDOWS_DRIVES = [chr(i) for i in range(ord("c"), ord("z") + 1)]
@PublicAPI
class JsonReader(InputReader):
"""Reader object that loads experiences from JSON file chunks.
    The input files will be read from in random order."""
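    # Minimal usage sketch (the directory below is hypothetical and assumed to
    # contain *.json files written by RLlib's JSON output writer):
    #
    #     reader = JsonReader("/tmp/demo-out")
    #     batch = reader.next()              # one SampleBatch/MultiAgentBatch
    #     for b in reader.read_all_files():  # or stream every stored batch
    #         ...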
@PublicAPI
    def __init__(self,
                 inputs: Union[str, List[str]],
                 ioctx: Optional[IOContext] = None):
"""Initialize a JsonReader.
Args:
            inputs (str|list): Either a glob expression for files, e.g.,
                "/tmp/**/*.json", a single directory (in which case all
                *.json and *.zip files inside it will be read), or a list of
                single file paths or URIs, e.g.,
                ["s3://bucket/file.json", "s3://bucket/file2.json"].
ioctx (IOContext): Current IO context object.
"""
self.ioctx = ioctx or IOContext()
self.default_policy = None
if self.ioctx.worker is not None:
self.default_policy = \
self.ioctx.worker.policy_map.get(DEFAULT_POLICY_ID)
if isinstance(inputs, str):
inputs = os.path.abspath(os.path.expanduser(inputs))
if os.path.isdir(inputs):
inputs = [
os.path.join(inputs, "*.json"),
os.path.join(inputs, "*.zip")
]
logger.warning(
f"Treating input directory as glob patterns: {inputs}")
else:
inputs = [inputs]
if any(
urlparse(i).scheme not in [""] + WINDOWS_DRIVES
for i in inputs):
raise ValueError(
"Don't know how to glob over `{}`, ".format(inputs) +
"please specify a list of files to read instead.")
else:
self.files = []
for i in inputs:
self.files.extend(glob.glob(i))
        elif isinstance(inputs, list):
self.files = inputs
else:
            raise ValueError(
                "Type of `inputs` must be list or str, not {}.".format(
                    type(inputs).__name__))
if self.files:
logger.info("Found {} input files.".format(len(self.files)))
else:
raise ValueError("No files found matching {}".format(inputs))
self.cur_file = None
@override(InputReader)
def next(self) -> SampleBatchType:
batch = self._try_parse(self._next_line())
tries = 0
while not batch and tries < 100:
tries += 1
logger.debug("Skipping empty line in {}".format(self.cur_file))
batch = self._try_parse(self._next_line())
if not batch:
raise ValueError(
"Failed to read valid experience batch from file: {}".format(
self.cur_file))
return self._postprocess_if_needed(batch)
def _postprocess_if_needed(self,
batch: SampleBatchType) -> SampleBatchType:
if not self.ioctx.config.get("postprocess_inputs"):
return batch
if isinstance(batch, SampleBatch):
out = []
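            # Postprocessing (e.g. advantage estimation) generally operates on
            # complete episodes, so split the batch into per-episode
            # sub-batches before handing each one to the default policy.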
for sub_batch in batch.split_by_episode():
out.append(
self.default_policy.postprocess_trajectory(sub_batch))
return SampleBatch.concat_samples(out)
else:
# TODO(ekl) this is trickier since the alignments between agent
# trajectories in the episode are not available any more.
raise NotImplementedError(
"Postprocessing of multi-agent data not implemented yet.")
def _try_open_file(self, path):
if urlparse(path).scheme not in [""] + WINDOWS_DRIVES:
if smart_open is None:
raise ValueError(
"You must install the `smart_open` module to read "
"from URIs like {}".format(path))
ctx = smart_open
else:
            # If the path doesn't exist, try to interpret it as relative to
            # the rllib directory (located ../../ from this very module).
path_orig = path
if not os.path.exists(path):
path = os.path.join(Path(__file__).parent.parent, path)
if not os.path.exists(path):
raise FileNotFoundError(f"Offline file {path_orig} not found!")
            # Unzip the file, if necessary, and re-point to the extracted
            # json file.
            if re.search(r"\.zip$", path):
with zipfile.ZipFile(path, "r") as zip_ref:
zip_ref.extractall(Path(path).parent)
                path = re.sub(r"\.zip$", ".json", path)
assert os.path.exists(path)
ctx = open
file = ctx(path, "r")
return file
def _try_parse(self, line: str) -> Optional[SampleBatchType]:
line = line.strip()
if not line:
return None
try:
batch = _from_json(line)
except Exception:
logger.exception("Ignoring corrupt json record in {}: {}".format(
self.cur_file, line))
return None
# Clip actions (from any values into env's bounds), if necessary.
cfg = self.ioctx.config
if cfg.get("clip_actions"):
if isinstance(batch, SampleBatch):
                batch[SampleBatch.ACTIONS] = clip_action(
                    batch[SampleBatch.ACTIONS], self.ioctx.worker.policy_map[
                        DEFAULT_POLICY_ID].action_space_struct)
else:
for pid, b in batch.policy_batches.items():
b[SampleBatch.ACTIONS] = clip_action(
b[SampleBatch.ACTIONS],
self.ioctx.worker.policy_map[pid].action_space_struct)
# Re-normalize actions (from env's bounds to 0.0 centered), if
# necessary.
if cfg.get("actions_in_input_normalized") is False:
if isinstance(batch, SampleBatch):
                batch[SampleBatch.ACTIONS] = normalize_action(
                    batch[SampleBatch.ACTIONS], self.ioctx.worker.policy_map[
                        DEFAULT_POLICY_ID].action_space_struct)
else:
for pid, b in batch.policy_batches.items():
b[SampleBatch.ACTIONS] = normalize_action(
b[SampleBatch.ACTIONS],
self.ioctx.worker.policy_map[pid].action_space_struct)
return batch
    def read_all_files(self):
        """Reads through all input files once, yielding each parsed batch."""
for path in self.files:
file = self._try_open_file(path)
while True:
line = file.readline()
if not line:
break
batch = self._try_parse(line)
if batch is None:
break
yield batch
def _next_line(self) -> str:
if not self.cur_file:
self.cur_file = self._next_file()
line = self.cur_file.readline()
tries = 0
while not line and tries < 100:
tries += 1
if hasattr(self.cur_file, "close"): # legacy smart_open impls
self.cur_file.close()
self.cur_file = self._next_file()
line = self.cur_file.readline()
if not line:
logger.debug("Ignoring empty file {}".format(self.cur_file))
if not line:
raise ValueError("Failed to read next line from files: {}".format(
self.files))
return line
def _next_file(self) -> FileType:
        # If this is the first time we open a file, make sure all workers
        # start with a different one if possible.
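        # E.g., with 5 input files and 4 remote workers, workers 1-4 would
        # start with files[1], files[2], files[3], and files[4], respectively.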
if self.cur_file is None and self.ioctx.worker is not None:
idx = self.ioctx.worker.worker_index
total = self.ioctx.worker.num_workers or 1
path = self.files[round((len(self.files) - 1) * (idx / total))]
# After the first file, pick all others randomly.
else:
path = random.choice(self.files)
return self._try_open_file(path)
def _from_json(batch: str) -> SampleBatchType:
if isinstance(batch, bytes): # smart_open S3 doesn't respect "r"
batch = batch.decode("utf-8")
data = json.loads(batch)
if "type" in data:
data_type = data.pop("type")
else:
raise ValueError("JSON record missing 'type' field")
if data_type == "SampleBatch":
for k, v in data.items():
data[k] = unpack_if_needed(v)
return SampleBatch(data)
elif data_type == "MultiAgentBatch":
policy_batches = {}
for policy_id, policy_batch in data["policy_batches"].items():
inner = {}
for k, v in policy_batch.items():
inner[k] = unpack_if_needed(v)
policy_batches[policy_id] = SampleBatch(inner)
return MultiAgentBatch(policy_batches, data["count"])
else:
raise ValueError(
"Type field must be one of ['SampleBatch', 'MultiAgentBatch']",
data_type)
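# Rough sketch of the JSON record layout `_from_json` expects (field names and
# values below are illustrative; files written by RLlib's JSON output writer
# may store columns in a packed form that `unpack_if_needed()` decodes):
#
#     {"type": "SampleBatch", "obs": [...], "actions": [...], "rewards": [...]}
#     {"type": "MultiAgentBatch", "count": 200,
#      "policy_batches": {"policy_0": {"obs": [...], "actions": [...]}}}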