import multiprocessing
from dask.distributed import Client, LocalCluster
Local cluster
Setup up local dask cluster
- possibly adjust number of threads per worker
- don’t forget to put the
Client(...)
in aif __name__ == "__main__"
context when running from a script
= multiprocessing.cpu_count()
n_workers
= 10 # how much memory will be spared from workers
mem_buffer
= 128 # total memory of machine
gb_total = gb_total - mem_buffer # what is left for dask
gb_available = int(gb_total / n_workers) # memory for each dask worker gb_per_worker
= Client(
client =LocalCluster(
address=n_workers,
n_workers=2,
threads_per_worker="lo",
interface=f"{gb_per_worker}GB",
memory_limit
) )
Inspect link to view dashboard
print(client.dashboard_link)
http://127.0.0.1:8787/status