[Datasets] Make BlockMetadata a dataclass (#23852)

This commit is contained in:
Balaji Veeramani 2022-04-20 22:46:25 -07:00 committed by GitHub
parent 0e6c042e29
commit 371d1f4533
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23

View file

@@ -1,3 +1,4 @@
from dataclasses import dataclass
import time
from typing import (
TypeVar,
@@ -142,6 +143,7 @@ class _BlockExecStatsBuilder:
@DeveloperAPI
@dataclass
class BlockMetadata:
"""Metadata about the block.
@@ -154,22 +156,15 @@ class BlockMetadata:
exec_stats: Execution stats for this block.
"""
def __init__(
self,
*,
num_rows: Optional[int],
size_bytes: Optional[int],
schema: Union[type, "pyarrow.lib.Schema"],
input_files: List[str],
exec_stats: Optional[BlockExecStats]
):
if input_files is None:
input_files = []
self.num_rows: Optional[int] = num_rows
self.size_bytes: Optional[int] = size_bytes
self.schema: Optional[Any] = schema
self.input_files: List[str] = input_files
self.exec_stats: Optional[BlockExecStats] = exec_stats
num_rows: Optional[int]
size_bytes: Optional[int]
schema: Optional[Union[type, "pyarrow.lib.Schema"]]
input_files: Optional[List[str]]
exec_stats: Optional[BlockExecStats]
def __post_init__(self):
if self.input_files is None:
self.input_files = []
@DeveloperAPI