#!/usr/bin/env python
# coding: utf-8

# ## Dask Array scales NumPy
#
# Dask array implements the NumPy API. It is composed of many small NumPy
# arrays.
#
# This script was exported from a notebook: the bare expressions below
# (``cluster``, ``client``, ``x``, ``y``) are the notebook's display cells and
# are kept so the statement sequence matches the original.

import dask.array as da
from dask.distributed import Client
from dask_kubernetes import KubeCluster

# Start a Kubernetes-backed cluster, asking for ten workers.
cluster = KubeCluster(n_workers=10)
cluster

# Attach a distributed client to that cluster.
client = Client(cluster)
client

# A 20000 x 20000 array of random values, split into 2000 x 2000 chunks and
# persisted.
x = da.random.random((20000, 20000), chunks=(2000, 2000)).persist()
x

# First five entries of the first row, pulled back as a concrete result.
x[0, :5].compute()

# Sum over every element of the array.
x.sum().compute()

# Add the array to its transpose, subtract the mean taken along axis 0, and
# persist the result.
y = (x + x.T - x.mean(axis=0)).persist()
y

# Top-left 5 x 5 corner of the derived array.
y[:5, :5].compute()