Skip to content

Commit 6758d14

Browse files
committed
Ensure arrow FS tokenize
1 parent ecb81f4 commit 6758d14

1 file changed

Lines changed: 7 additions & 1 deletion

File tree

dask/dataframe/io/parquet/arrow.py

Lines changed: 7 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -11,6 +11,7 @@
1111
import numpy as np
1212
import pandas as pd
1313
import pyarrow as pa
14+
import pyarrow.fs as pa_fs
1415
import pyarrow.parquet as pq
1516

1617
# Check PyArrow version for feature support
@@ -20,7 +21,7 @@
2021
from pyarrow import fs as pa_fs
2122

2223
import dask
23-
from dask.base import tokenize
24+
from dask.base import normalize_token, tokenize
2425
from dask.core import flatten
2526
from dask.dataframe.backends import pyarrow_schema_dispatch
2627
from dask.dataframe.io.parquet.utils import (
@@ -55,6 +56,11 @@
5556
}
5657

5758

59+
@normalize_token.register(pa_fs.FileSystem)
def tokenize_arrowfs(obj):
    """Return the normalized form of a PyArrow filesystem.

    Registered on ``normalize_token`` for ``pa_fs.FileSystem``, so this
    handler is selected for instances of that type.

    Parameters
    ----------
    obj : pa_fs.FileSystem
        The filesystem object to normalize.

    Returns
    -------
    The value produced by ``obj.__reduce__()``.
    """
    # The pickle-protocol reduction is used as the normalized form.
    reduced = obj.__reduce__()
    return reduced
62+
63+
5864
#
5965
# Helper Utilities
6066
#

0 commit comments

Comments
 (0)