dask · gjoseph92 · Sep 17, 2021 · Sep 17, 2021 · Sep 17, 2021 · May 4, 2022
@@ -2687,7 +2687,8 @@ def get_comm_cost(self, ts: TaskState, ws: WorkerState) -> float:
         nbytes: int = 0
         for dts in deps:
             nbytes += dts.nbytes
-        return nbytes / self.bandwidth
+        # Add a fixed 10ms penalty per transfer. See distributed#5324
+        return nbytes / self._bandwidth + 0.01 * len(deps)
 
     def get_task_duration(self, ts: TaskState) -> float:
         """Get the estimated computation cost of the given task (not including
@@ -2799,13 +2800,16 @@ def worker_objective(self, ts: TaskState, ws: WorkerState) -> tuple:
         """
         dts: TaskState
         comm_bytes: int = 0
+        xfers: int = 0
         for dts in ts.dependencies:
             if ws not in dts.who_has:
                 nbytes = dts.get_nbytes()
-                comm_bytes += nbytes
+                # amortize transfer cost over all waiters
+                comm_bytes += nbytes / len(dts.waiters)
+                xfers += 1
-                # amortize transfer cost over all waiters
-                comm_bytes += nbytes / len(dts.waiters)
-                xfers += 1
+                nwaiters = len(dts.waiters)
+                # amortize transfer cost over all waiters
+                comm_bytes += nbytes / nwaiters
+                xfers += 1 / nwaiters
-                # amortize transfer cost over all waiters
-                comm_bytes += nbytes / len(dts.waiters)
-                xfers += 1
+                nwaiters = len(dts.waiters)
+                # amortize transfer cost over all waiters
+                comm_bytes += nbytes / nwaiters
+                xfers += 1 / nwaiters
 
-        stack_time: float = ws.occupancy / ws.nthreads
-        start_time: float = stack_time + comm_bytes / self.bandwidth
+        stack_time: double = ws.occupancy / ws.nthreads
+        start_time: double = stack_time + comm_bytes / self.bandwidth + xfers * 0.01
 
         if ts.actor:
             return (len(ws.actors), start_time, ws.nbytes)