@@ -1163,7 +1163,7 @@ def map(
1163
1163
keep_in_memory (`bool`, defaults to `False`): Keep the dataset in memory instead of writing it to a cache file.
1164
1164
load_from_cache_file (`bool`, defaults to `True`): If a cache file storing the current computation from `function`
1165
1165
can be identified, use it instead of recomputing.
1166
- cache_file_name (`Optional[str]`, defaults to `None`): Provide the name of a cache file to use to store the
1166
+ cache_file_name (`Optional[str]`, defaults to `None`): Provide the path to the cache file. It is used to store the
1167
1167
results of the computation instead of the automatically generated cache file name.
1168
1168
writer_batch_size (`int`, defaults to `1000`): Number of rows per write operation for the cache file writer.
1169
1169
Higher values give smaller cache files, lower values consume less temporary memory while running `.map()`.
@@ -1369,7 +1369,7 @@ def _map_single(
1369
1369
keep_in_memory (`bool`, defaults to `False`): Keep the dataset in memory instead of writing it to a cache file.
1370
1370
load_from_cache_file (`bool`, defaults to `True`): If a cache file storing the current computation from `function`
1371
1371
can be identified, use it instead of recomputing.
1372
- cache_file_name (`Optional[str]`, defaults to `None`): Provide the name of a cache file to use to store the
1372
+ cache_file_name (`Optional[str]`, defaults to `None`): Provide the path to the cache file. It is used to store the
1373
1373
results of the computation instead of the automatically generated cache file name.
1374
1374
writer_batch_size (`int`, defaults to `1000`): Number of rows per write operation for the cache file writer.
1375
1375
Higher values give smaller cache files, lower values consume less temporary memory while running `.map()`.
@@ -1590,7 +1590,7 @@ def filter(
1590
1590
keep_in_memory (`bool`, defaults to `False`): Keep the dataset in memory instead of writing it to a cache file.
1591
1591
load_from_cache_file (`bool`, defaults to `True`): If a cache file storing the current computation from `function`
1592
1592
can be identified, use it instead of recomputing.
1593
- cache_file_name (`Optional[str]`, defaults to `None`): Provide the name of a cache file to use to store the
1593
+ cache_file_name (`Optional[str]`, defaults to `None`): Provide the path to the cache file. It is used to store the
1594
1594
results of the computation instead of the automatically generated cache file name.
1595
1595
writer_batch_size (`int`, defaults to `1000`): Number of rows per write operation for the cache file writer.
1596
1596
Higher values give smaller cache files, lower values consume less temporary memory while running `.map()`.
@@ -1660,7 +1660,7 @@ def flatten_indices(
1660
1660
1661
1661
Args:
1662
1662
keep_in_memory (`bool`, default: `False`): Keep the dataset in memory instead of writing it to a cache file.
1663
- cache_file_name (`Optional[str]`, defaults to `None`): Provide the name of a cache file to use to store the
1663
+ cache_file_name (`Optional[str]`, defaults to `None`): Provide the path to the cache file. It is used to store the
1664
1664
results of the computation instead of the automatically generated cache file name.
1665
1665
writer_batch_size (`int`, defaults to `1000`): Number of rows per write operation for the cache file writer.
1666
1666
Higher values give smaller cache files, lower values consume less temporary memory while running `.map()`.
@@ -1736,7 +1736,7 @@ def select(
1736
1736
Args:
1737
1737
`indices` (sequence, iterable, ndarray or Series): List or 1D-array of integer indices for indexing.
1738
1738
`keep_in_memory` (`bool`, default: `False`): Keep the indices mapping in memory instead of writing it to a cache file.
1739
- `indices_cache_file_name` (`Optional[str]`, default: `None`): Provide the name of a cache file to use to store the
1739
+ `indices_cache_file_name` (`Optional[str]`, default: `None`): Provide the path to the cache file. It is used to store the
1740
1740
indices mapping instead of the automatically generated cache file name.
1741
1741
`writer_batch_size` (`int`, default: `1000`): Number of rows per write operation for the cache file writer.
1742
1742
Higher values give smaller cache files, lower values consume less temporary memory while running `.map()`.
@@ -1830,7 +1830,7 @@ def sort(
1830
1830
keep_in_memory (`bool`, defaults to `False`): Keep the sorted indices in memory instead of writing them to a cache file.
1831
1831
load_from_cache_file (`bool`, defaults to `True`): If a cache file storing the sorted indices
1832
1832
can be identified, use it instead of recomputing.
1833
- indices_cache_file_name (`Optional[str]`, defaults to `None`): Provide the name of a cache file to use to store the
1833
+ indices_cache_file_name (`Optional[str]`, defaults to `None`): Provide the path to the cache file. It is used to store the
1834
1834
sorted indices instead of the automatically generated cache file name.
1835
1835
writer_batch_size (`int`, defaults to `1000`): Number of rows per write operation for the cache file writer.
1836
1836
Higher values give smaller cache files, lower values consume less temporary memory.
@@ -1906,7 +1906,7 @@ def shuffle(
1906
1906
keep_in_memory (`bool`, defaults to `False`): Keep the shuffled indices in memory instead of writing them to a cache file.
1907
1907
load_from_cache_file (`bool`, defaults to `True`): If a cache file storing the shuffled indices
1908
1908
can be identified, use it instead of recomputing.
1909
- indices_cache_file_name (`Optional[str]`, defaults to `None`): Provide the name of a cache file to use to store the
1909
+ indices_cache_file_name (`Optional[str]`, defaults to `None`): Provide the path to the cache file. It is used to store the
1910
1910
shuffled indices instead of the automatically generated cache file name.
1911
1911
writer_batch_size (`int`, defaults to `1000`): Number of rows per write operation for the cache file writer.
1912
1912
Higher values give smaller cache files, lower values consume less temporary memory while running `.map()`.
@@ -1998,9 +1998,9 @@ def train_test_split(
1998
1998
keep_in_memory (`bool`, defaults to `False`): Keep the split indices in memory instead of writing them to a cache file.
1999
1999
load_from_cache_file (`bool`, defaults to `True`): If a cache file storing the split indices
2000
2000
can be identified, use it instead of recomputing.
2001
- train_cache_file_name (`Optional[str]`, defaults to `None`): Provide the name of a cache file to use to store the
2001
+ train_cache_file_name (`Optional[str]`, defaults to `None`): Provide the path to the cache file. It is used to store the
2002
2002
train split indices instead of the automatically generated cache file name.
2003
- test_cache_file_name (`Optional[str]`, defaults to `None`): Provide the name of a cache file to use to store the
2003
+ test_cache_file_name (`Optional[str]`, defaults to `None`): Provide the path to the cache file. It is used to store the
2004
2004
test split indices instead of the automatically generated cache file name.
2005
2005
writer_batch_size (`int`, defaults to `1000`): Number of rows per write operation for the cache file writer.
2006
2006
Higher values give smaller cache files, lower values consume less temporary memory while running `.map()`.
@@ -2183,7 +2183,7 @@ def shard(
2183
2183
keep_in_memory (`bool`, defaults to `False`): Keep the dataset in memory instead of writing it to a cache file.
2184
2184
load_from_cache_file (`bool`, defaults to `True`): If a cache file storing the current computation from `function`
2185
2185
can be identified, use it instead of recomputing.
2186
- indices_cache_file_name (`Optional[str]`, defaults to `None`): Provide the name of a cache file to use to store the
2186
+ indices_cache_file_name (`Optional[str]`, defaults to `None`): Provide the path to the cache file. It is used to store the
2187
2187
indices of each shard instead of the automatically generated cache file name.
2188
2188
writer_batch_size (`int`, defaults to `1000`): Number of rows per write operation for the cache file writer.
2189
2189
Higher values give smaller cache files, lower values consume less temporary memory while running `.map()`.
0 commit comments