2022-01-27 22:14:36 +01:00
|
|
|
.. _data_api:
|
|
|
|
|
2022-02-05 18:59:34 -06:00
|
|
|
Ray Datasets API
|
|
|
|
================
|
2021-07-14 23:27:13 -07:00
|
|
|
|
2022-01-27 22:14:36 +01:00
|
|
|
Creating Datasets
|
|
|
|
-----------------
|
|
|
|
|
2021-07-15 09:50:37 -07:00
|
|
|
.. autofunction:: ray.data.range
|
2022-05-17 01:09:45 -07:00
|
|
|
.. autofunction:: ray.data.range_table
|
2021-08-01 22:45:21 -07:00
|
|
|
.. autofunction:: ray.data.range_tensor
|
2021-07-15 09:50:37 -07:00
|
|
|
.. autofunction:: ray.data.read_csv
|
|
|
|
.. autofunction:: ray.data.read_json
|
|
|
|
.. autofunction:: ray.data.read_parquet
|
2021-08-01 22:45:21 -07:00
|
|
|
.. autofunction:: ray.data.read_numpy
|
|
|
|
.. autofunction:: ray.data.read_text
|
2021-07-15 09:50:37 -07:00
|
|
|
.. autofunction:: ray.data.read_binary_files
|
|
|
|
.. autofunction:: ray.data.read_datasource
|
2021-08-04 13:31:10 -07:00
|
|
|
.. autofunction:: ray.data.from_items
|
2021-07-28 21:12:01 -07:00
|
|
|
.. autofunction:: ray.data.from_arrow
|
2021-10-01 13:08:25 -07:00
|
|
|
.. autofunction:: ray.data.from_arrow_refs
|
2022-05-06 22:09:28 +02:00
|
|
|
.. autofunction:: ray.data.from_huggingface
|
2021-07-15 09:50:37 -07:00
|
|
|
.. autofunction:: ray.data.from_spark
|
|
|
|
.. autofunction:: ray.data.from_dask
|
|
|
|
.. autofunction:: ray.data.from_modin
|
|
|
|
.. autofunction:: ray.data.from_mars
|
|
|
|
.. autofunction:: ray.data.from_pandas
|
2021-10-01 13:08:25 -07:00
|
|
|
.. autofunction:: ray.data.from_pandas_refs
|
2021-08-27 13:33:11 -07:00
|
|
|
.. autofunction:: ray.data.from_numpy
|
2022-04-12 18:37:59 -07:00
|
|
|
.. autofunction:: ray.data.from_numpy_refs
|
2021-07-14 23:27:13 -07:00
|
|
|
|
2021-10-12 14:03:10 -07:00
|
|
|
.. _dataset-api:
|
|
|
|
|
2021-07-14 23:27:13 -07:00
|
|
|
Dataset API
|
|
|
|
-----------
|
|
|
|
|
2021-07-15 09:50:37 -07:00
|
|
|
.. autoclass:: ray.data.Dataset
|
2021-07-14 23:27:13 -07:00
|
|
|
:members:
|
|
|
|
|
2021-10-12 14:03:10 -07:00
|
|
|
.. _dataset-pipeline-api:
|
|
|
|
|
2022-04-16 11:57:38 -07:00
|
|
|
Block API
|
|
|
|
---------
|
|
|
|
|
|
|
|
.. autoclass:: ray.data.block.BlockExecStats
|
|
|
|
:members:
|
|
|
|
|
|
|
|
.. autoclass:: ray.data.block.BlockMetadata
|
|
|
|
:members:
|
|
|
|
|
|
|
|
.. autoclass:: ray.data.block.BlockAccessor
|
|
|
|
:members:
|
|
|
|
|
|
|
|
DatasetContext API
|
|
|
|
------------------
|
|
|
|
|
|
|
|
.. autoclass:: ray.data.context.DatasetContext
|
|
|
|
:members:
|
|
|
|
|
2021-07-28 21:12:01 -07:00
|
|
|
DatasetPipeline API
|
|
|
|
-------------------
|
|
|
|
|
2021-08-04 13:31:10 -07:00
|
|
|
.. autoclass:: ray.data.dataset_pipeline.DatasetPipeline
|
2021-07-28 21:12:01 -07:00
|
|
|
:members:
|
|
|
|
|
2021-10-19 19:53:13 -07:00
|
|
|
GroupedDataset API
|
|
|
|
------------------
|
|
|
|
|
|
|
|
.. autoclass:: ray.data.grouped_dataset.GroupedDataset
|
|
|
|
:members:
|
|
|
|
|
2022-04-16 11:57:38 -07:00
|
|
|
Aggregate API
|
|
|
|
-------------
|
|
|
|
|
|
|
|
.. autoclass:: ray.data.aggregate.AggregateFn
|
|
|
|
:members:
|
|
|
|
|
|
|
|
.. autoclass:: ray.data.aggregate.Count
|
|
|
|
:members:
|
|
|
|
|
|
|
|
.. autoclass:: ray.data.aggregate.Sum
|
|
|
|
:members:
|
|
|
|
|
|
|
|
.. autoclass:: ray.data.aggregate.Max
|
|
|
|
:members:
|
|
|
|
|
|
|
|
.. autoclass:: ray.data.aggregate.Mean
|
|
|
|
:members:
|
|
|
|
|
|
|
|
.. autoclass:: ray.data.aggregate.Std
|
|
|
|
:members:
|
|
|
|
|
2022-04-25 13:12:59 -07:00
|
|
|
.. autoclass:: ray.data.aggregate.AbsMax
|
|
|
|
:members:
|
|
|
|
|
2022-03-17 15:01:12 -07:00
|
|
|
RandomAccessDataset API
|
|
|
|
-----------------------
|
|
|
|
|
|
|
|
.. autoclass:: ray.data.random_access_dataset.RandomAccessDataset
|
|
|
|
:members:
|
|
|
|
|
2021-09-08 10:09:01 -07:00
|
|
|
Tensor Column Extension API
|
|
|
|
---------------------------
|
|
|
|
|
|
|
|
.. autoclass:: ray.data.extensions.tensor_extension.TensorDtype
|
|
|
|
:members:
|
|
|
|
|
|
|
|
.. autoclass:: ray.data.extensions.tensor_extension.TensorArray
|
|
|
|
:members:
|
|
|
|
|
|
|
|
.. autoclass:: ray.data.extensions.tensor_extension.ArrowTensorType
|
|
|
|
:members:
|
|
|
|
|
|
|
|
.. autoclass:: ray.data.extensions.tensor_extension.ArrowTensorArray
|
|
|
|
:members:
|
|
|
|
|
2021-07-14 23:27:13 -07:00
|
|
|
Custom Datasource API
|
|
|
|
---------------------
|
|
|
|
|
2021-07-15 09:50:37 -07:00
|
|
|
.. autoclass:: ray.data.Datasource
|
2021-07-14 23:27:13 -07:00
|
|
|
:members:
|
|
|
|
|
2021-07-15 09:50:37 -07:00
|
|
|
.. autoclass:: ray.data.ReadTask
|
2021-07-14 23:27:13 -07:00
|
|
|
:members:
|
|
|
|
|
2022-05-23 09:34:41 -07:00
|
|
|
Datasource Partitioning API
|
|
|
|
---------------------------
|
|
|
|
|
|
|
|
.. autoclass:: ray.data.datasource.PartitionStyle
|
|
|
|
:members:
|
|
|
|
|
|
|
|
.. autoclass:: ray.data.datasource.PathPartitionScheme
|
|
|
|
:members:
|
|
|
|
|
|
|
|
.. autoclass:: ray.data.datasource.PathPartitionEncoder
|
|
|
|
:members:
|
|
|
|
|
|
|
|
.. autoclass:: ray.data.datasource.PathPartitionParser
|
|
|
|
:members:
|
|
|
|
|
|
|
|
.. autoclass:: ray.data.datasource.PathPartitionFilter
|
|
|
|
|
2022-04-28 11:56:45 -07:00
|
|
|
Built-in Datasources
|
|
|
|
--------------------
|
|
|
|
|
|
|
|
.. autoclass:: ray.data.datasource.BinaryDatasource
|
|
|
|
:members:
|
|
|
|
|
|
|
|
.. autoclass:: ray.data.datasource.CSVDatasource
|
|
|
|
:members:
|
|
|
|
|
|
|
|
.. autoclass:: ray.data.datasource.FileBasedDatasource
|
|
|
|
:members:
|
|
|
|
|
|
|
|
.. autoclass:: ray.data.datasource.JSONDatasource
|
|
|
|
:members:
|
|
|
|
|
|
|
|
.. autoclass:: ray.data.datasource.NumpyDatasource
|
|
|
|
:members:
|
|
|
|
|
|
|
|
.. autoclass:: ray.data.datasource.ParquetDatasource
|
|
|
|
:members:
|
|
|
|
|
|
|
|
.. autoclass:: ray.data.datasource.RangeDatasource
|
|
|
|
:members:
|
2022-05-23 09:34:41 -07:00
|
|
|
|
2022-04-29 12:15:30 -07:00
|
|
|
.. autoclass:: ray.data.datasource.SimpleTensorFlowDatasource
|
|
|
|
:members:
|
|
|
|
|
2022-04-28 11:56:45 -07:00
|
|
|
.. autoclass:: ray.data.datasource.SimpleTorchDatasource
|
|
|
|
:members:
|
|
|
|
|
2022-02-14 14:56:17 -06:00
|
|
|
Table Row API
|
|
|
|
-------------
|
|
|
|
|
|
|
|
.. autoclass:: ray.data.row.TableRow
|
|
|
|
:members:
|
|
|
|
|
2021-07-30 09:51:21 -07:00
|
|
|
Utility
|
|
|
|
-------
|
|
|
|
.. autofunction:: ray.data.set_progress_bars
|