
Commit 37119a9

p2p shuffle without pyArrow
1 parent 3f210fd commit 37119a9

File tree

15 files changed: +136 -549 lines changed


distributed/shuffle/__init__.py

Lines changed: 0 additions & 2 deletions

@@ -1,14 +1,12 @@
 from __future__ import annotations

-from distributed.shuffle._arrow import check_minimal_arrow_version
 from distributed.shuffle._merge import HashJoinP2PLayer, hash_join_p2p
 from distributed.shuffle._rechunk import rechunk_p2p
 from distributed.shuffle._scheduler_plugin import ShuffleSchedulerPlugin
 from distributed.shuffle._shuffle import P2PShuffleLayer, rearrange_by_column_p2p
 from distributed.shuffle._worker_plugin import ShuffleWorkerPlugin

 __all__ = [
-    "check_minimal_arrow_version",
     "hash_join_p2p",
     "HashJoinP2PLayer",
     "P2PShuffleLayer",

distributed/shuffle/_arrow.py

Lines changed: 0 additions & 201 deletions
This file was deleted.

distributed/shuffle/_core.py

Lines changed: 3 additions & 12 deletions

@@ -19,7 +19,6 @@
 from dataclasses import dataclass, field
 from enum import Enum
 from functools import partial
-from pathlib import Path
 from typing import TYPE_CHECKING, Any, Generic, NewType, TypeVar, cast

 from tornado.ioloop import IOLoop

@@ -38,6 +37,7 @@
 from distributed.shuffle._exceptions import ShuffleClosedError
 from distributed.shuffle._limiter import ResourceLimiter
 from distributed.shuffle._memory import MemoryShardsBuffer
+from distributed.sizeof import safe_sizeof as sizeof
 from distributed.utils import run_in_executor_with_context, sync
 from distributed.utils_comm import retry

@@ -116,11 +116,10 @@ def __init__(
         if disk:
             self._disk_buffer = DiskShardsBuffer(
                 directory=directory,
-                read=self.read,
                 memory_limiter=memory_limiter_disk,
             )
         else:
-            self._disk_buffer = MemoryShardsBuffer(deserialize=self.deserialize)
+            self._disk_buffer = MemoryShardsBuffer()

         with self._capture_metrics("background-comms"):
             self._comm_buffer = CommShardsBuffer(

@@ -372,14 +371,6 @@ def _get_output_partition(
     ) -> _T_partition_type:
         """Get an output partition to the shuffle run"""

-    @abc.abstractmethod
-    def read(self, path: Path) -> tuple[Any, int]:
-        """Read shards from disk"""
-
-    @abc.abstractmethod
-    def deserialize(self, buffer: Any) -> Any:
-        """Deserialize shards"""
-

 def get_worker_plugin() -> ShuffleWorkerPlugin:
     from distributed import get_worker

@@ -518,7 +509,7 @@ def _mean_shard_size(shards: Iterable) -> int:
         if not isinstance(shard, int):
             # This also asserts that shard is a Buffer and that we didn't forget
             # a container or metadata type above
-            size += memoryview(shard).nbytes
+            size += sizeof(shard)
             count += 1
             if count == 10:
                 break
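The last hunk above swaps the raw memoryview(shard).nbytes measurement for distributed's generic safe_sizeof, so the estimate no longer requires each shard to expose the buffer protocol. A minimal sketch of the sampling idea follows; the helper name mean_shard_size_sketch and everything beyond the context lines shown in the hunk are illustrative assumptions, not the actual _mean_shard_size body:

from collections.abc import Iterable

from distributed.sizeof import safe_sizeof as sizeof


def mean_shard_size_sketch(shards: Iterable, sample: int = 10) -> int:
    """Estimate the mean shard size by measuring at most `sample` shards.

    Illustrative sketch only; the real _mean_shard_size in
    distributed/shuffle/_core.py also unwraps nested containers and
    metadata, which is omitted here.
    """
    size = 0
    count = 0
    for shard in shards:
        if isinstance(shard, int):
            continue  # plain ints are metadata, not payload
        size += sizeof(shard)  # generic sizeof instead of memoryview(shard).nbytes
        count += 1
        if count == sample:  # a small sample is enough for an estimate
            break
    return size // count if count else 0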

distributed/shuffle/_disk.py

Lines changed: 36 additions & 26 deletions

@@ -1,21 +1,21 @@
 from __future__ import annotations

 import contextlib
+import mmap
 import pathlib
 import shutil
 import threading
-from collections.abc import Callable, Generator, Iterable
+from collections.abc import Generator, Iterator
 from contextlib import contextmanager
+from pathlib import Path
 from typing import Any

-from toolz import concat
-
 from distributed.metrics import context_meter, thread_time
 from distributed.shuffle._buffer import ShardsBuffer
 from distributed.shuffle._exceptions import DataUnavailable
 from distributed.shuffle._limiter import ResourceLimiter
-from distributed.shuffle._pickle import pickle_bytelist
-from distributed.utils import Deadline, empty_context, log_errors, nbytes
+from distributed.shuffle._pickle import pickle_bytelist, unpickle_bytestream
+from distributed.utils import Deadline, log_errors, nbytes


 class ReadWriteLock:

@@ -126,7 +126,6 @@ class DiskShardsBuffer(ShardsBuffer):
     def __init__(
         self,
         directory: str | pathlib.Path,
-        read: Callable[[pathlib.Path], tuple[Any, int]],
         memory_limiter: ResourceLimiter,
     ):
         super().__init__(

@@ -137,11 +136,10 @@ def __init__(
         self.directory = pathlib.Path(directory)
         self.directory.mkdir(exist_ok=True)
         self._closed = False
-        self._read = read
         self._directory_lock = ReadWriteLock()

     @log_errors
-    async def _process(self, id: str, shards: list[Any]) -> None:
+    async def _process(self, id: str, shards: list[object]) -> None:
         """Write one buffer to file

         This function was built to offload the disk IO, but since then we've
@@ -154,36 +152,30 @@ async def _process(self, id: str, shards: list[Any]) -> None:
         future then we should consider simplifying this considerably and
         dropping the write into communicate above.
         """
-        frames: Iterable[bytes | bytearray | memoryview]
-        if isinstance(shards[0], bytes):
-            # Manually serialized dataframes
-            frames = shards
-            serialize_meter_ctx: Any = empty_context
-        else:
-            # Unserialized numpy arrays
-            # Note: no calls to pickle_bytelist will happen until we actually start
-            # writing to disk below.
-            frames = concat(pickle_bytelist(shard) for shard in shards)
-            serialize_meter_ctx = context_meter.meter("serialize", func=thread_time)
+        nbytes_acc = 0
+
+        def pickle_and_tally() -> Iterator[bytes | memoryview]:
+            nonlocal nbytes_acc
+            for shard in shards:
+                for frame in pickle_bytelist(shard):
+                    nbytes_acc += nbytes(frame)
+                    yield frame

         with (
             self._directory_lock.read(),
             context_meter.meter("disk-write"),
-            serialize_meter_ctx,
+            context_meter.meter("serialize", func=thread_time),
         ):
-            # Consider boosting total_size a bit here to account for duplication
-            # We only need shared (i.e., read) access to the directory to write
-            # to a file inside of it.
             if self._closed:
                 raise RuntimeError("Already closed")

             with open(self.directory / str(id), mode="ab") as f:
-                f.writelines(frames)
+                f.writelines(pickle_and_tally())

             context_meter.digest_metric("disk-write", 1, "count")
-            context_meter.digest_metric("disk-write", sum(map(nbytes, frames)), "bytes")
+            context_meter.digest_metric("disk-write", nbytes_acc, "bytes")

-    def read(self, id: str) -> Any:
+    def read(self, id: str) -> list[Any]:
         """Read a complete file back into memory"""
         self.raise_on_exception()
         if not self._inputs_done:
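The rewritten _process above replaces the two serialization branches (pre-serialized dataframe bytes vs. unserialized numpy arrays) with a single lazy generator: frames are pickled only as f.writelines consumes them, and the running byte total lands in nbytes_acc without materializing the frame list. A self-contained sketch of that pattern, using plain pickle.dumps as a stand-in for pickle_bytelist (which lives in distributed/shuffle/_pickle.py and is not part of this diff); the name write_shards_sketch is made up for illustration:

import pickle
from collections.abc import Iterator


def write_shards_sketch(path: str, shards: list[object]) -> int:
    """Append pickled shards to a file, tallying bytes while writelines
    drains the generator. Stand-in for DiskShardsBuffer._process; the real
    code emits multiple frames per shard via pickle_bytelist.
    """
    nbytes_acc = 0

    def pickle_and_tally() -> Iterator[bytes]:
        nonlocal nbytes_acc
        for shard in shards:
            frame = pickle.dumps(shard, protocol=pickle.HIGHEST_PROTOCOL)
            nbytes_acc += len(frame)
            yield frame

    with open(path, mode="ab") as f:
        # Serialization happens here, frame by frame, as writelines iterates.
        f.writelines(pickle_and_tally())

    return nbytes_acc

Because the pickling happens inside the writelines call, wrapping that call in the "serialize" meter, as the hunk does, attributes serialization time to the right metric.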
@@ -210,6 +202,24 @@ def read(self, id: str) -> Any:
         else:
             raise DataUnavailable(id)

+    @staticmethod
+    def _read(path: Path) -> tuple[list[Any], int]:
+        """Open a memory-mapped file descriptor to disk, read all metadata, and unpickle
+        all arrays. This is a fast sequence of short reads interleaved with seeks.
+        Do not read in memory the actual data; the arrays' buffers will point to the
+        memory-mapped area.
+
+        The file descriptor will be automatically closed by the kernel when all the
+        returned arrays are dereferenced, which will happen after the call to
+        concatenate3.
+        """
+        with path.open(mode="r+b") as fh:
+            buffer = memoryview(mmap.mmap(fh.fileno(), 0))
+
+        # The file descriptor has *not* been closed!
+        shards = list(unpickle_bytestream(buffer))
+        return shards, buffer.nbytes
+
     async def close(self) -> None:
         await super().close()
         with self._directory_lock.write():
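The new _read above memory-maps the whole spill file and unpickles every shard from the mapping, so only pickle metadata is touched eagerly while the payload stays backed by the map. unpickle_bytestream is defined in distributed/shuffle/_pickle.py and is not shown in this commit; the sketch below approximates the read path with plain pickle.load, which copies the payload out of the mapping rather than pointing into it (the name read_shards_sketch is illustrative):

import mmap
import pickle
from pathlib import Path
from typing import Any


def read_shards_sketch(path: Path) -> tuple[list[Any], int]:
    """Memory-map a spill file and unpickle shards written back-to-back.

    Rough counterpart to DiskShardsBuffer._read above, minus the zero-copy
    out-of-band buffers that unpickle_bytestream restores.
    """
    with path.open(mode="r+b") as fh:
        # mmap duplicates the file descriptor, so closing fh here is fine.
        mm = mmap.mmap(fh.fileno(), 0)

    shards: list[Any] = []
    while mm.tell() < mm.size():
        # mmap objects expose file-like read()/readline(), so pickle.load can
        # consume the pickles one after another straight from the mapping.
        shards.append(pickle.load(mm))
    return shards, mm.size()

The real read path stays zero-copy because, as the docstring in the hunk notes, the unpickled arrays' buffers point into the memory-mapped area and the mapping is released only once they are dereferenced.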
