huggingface · kratos0718 · May 27, 2026
diff --git a/src/datasets/arrow_dataset.py b/src/datasets/arrow_dataset.py
@@ -2322,6 +2322,9 @@ def flatten(self, new_fingerprint: Optional[str] = None, max_depth=16) -> "Datas
             new_fingerprint (`str`, *optional*):
                 The new fingerprint of the dataset after transform.
                 If `None`, the new fingerprint is computed using a hash of the previous fingerprint, and the transform arguments.
+            max_depth (`int`, defaults to `16`):
+                Maximum number of nesting levels to flatten. Flattening stops when either
+                no struct columns remain or `max_depth` iterations have been completed.
 
         Returns:
             [`Dataset`]: A copy of the dataset with flattened columns.

diff --git a/src/datasets/load.py b/src/datasets/load.py
@@ -1568,6 +1568,10 @@ def load_dataset(
             Whether to copy the dataset in-memory. If `None`, the dataset
             will not be copied in-memory unless explicitly enabled by setting `datasets.config.IN_MEMORY_MAX_SIZE` to
             nonzero. See more details in the [improve performance](../cache#improve-performance) section.
+        save_infos (`bool`, defaults to `False`):
+            Save the dataset builders' infos (checksums/size/splits/...). If `True`, this
+            overrides `verification_mode` and sets it to [`VerificationMode.ALL_CHECKS`],
+            forcing full verification.
         revision ([`Version`] or `str`, *optional*):
             Version of the dataset to load.
             As datasets have their own git repository on the Datasets Hub, the default version "main" corresponds to their "main" branch.