Parallel programmeren met Dask in Python
James Fulton
Climate Informatics Researcher
dask.delayed()# Standaard gebruiken result = x.compute()result = dask.compute(x)# Threads gebruiken result = x.compute(scheduler='threads')result = dask.compute(x, scheduler='threads')# Processen gebruiken result = x.compute(scheduler='processes')result = dask.compute(x, scheduler='processes')
from dask.distributed import LocalCluster
cluster = LocalCluster(
processes=True,
n_workers=2,
threads_per_worker=2
)
print(cluster)
LocalCluster(..., workers=2, threads=4, memory=31.38 GiB)
from dask.distributed import LocalCluster
cluster = LocalCluster(
processes=False,
n_workers=2,
threads_per_worker=2
)
print(cluster)
LocalCluster(..., workers=2, threads=4, memory=31.38 GiB)
cluster = LocalCluster(processes=True)
print(cluster)
LocalCluster(..., workers=4 threads=8, memory=31.38 GiB)
cluster = LocalCluster(processes=False)
print(cluster)
LocalCluster(..., workers=1 threads=8, memory=31.38 GiB)
from dask.distributed import Client, LocalCluster
cluster = LocalCluster(
processes=True,
n_workers=4,
threads_per_worker=2
)
client = Client(cluster)
print(client)
<Client: 'tcp://127.0.0.1:61391' processes=4 threads=8, memory=31.38 GiB>
Maak eerst een cluster en geef die door aan de client
cluster = LocalCluster(
processes=True,
n_workers=4,
threads_per_worker=2
)
client = Client(cluster)
print(client)
<Client: ... processes=4 threads=8, ...>
Maak een client die zelf een cluster aanmaakt
client = Client(
processes=True,
n_workers=4,
threads_per_worker=2
)
print(client)
<Client: ... processes=4 threads=8, ...>
client = Client(processes=True) # Standaard gebruikt de client result = x.compute()# Je kunt een andere scheduler kiezen result = x.compute(scheduler='threads')# Client expliciet gebruiken kan ook result = client.compute(x)
LocalCluster() - Een cluster op je computer.Parallel programmeren met Dask in Python