#!/usr/bin/env python
# coding: utf-8

# Notebook export: times a few Modin operations (on the Dask engine) against
# the January 2015 NYC yellow-taxi trip CSV.
#
# NOTE: `get_ipython()` is never imported in this file; it is the helper that
# IPython/Jupyter injects into the namespace, so the timing cells below are
# expected to run under IPython rather than plain `python`.

# In[1]:

# To run this notebook as done in the README GIFs, you must first locally
# download the 2015 NYC Taxi Trip Data.
import urllib.request

url_path = "https://modin-test.s3.us-west-1.amazonaws.com/yellow_tripdata_2015-01.csv"
# Saves the CSV as "taxi.csv" in the current working directory; the later
# read_csv cell reads it back by that same relative name.
urllib.request.urlretrieve(url_path, "taxi.csv")

# Select Dask as the Modin execution engine. This is done before
# `modin.pandas` is imported below; keep that ordering.
from modin.config import Engine

Engine.put("dask")

# Start a local Dask cluster with 12 worker processes.
from dask.distributed import Client

client = Client(n_workers=12)

# Turn on Modin's benchmark mode.
# NOTE(review): per the Modin configuration docs this makes operations run
# synchronously so that %time reflects the full cost -- confirm against the
# installed Modin version.
from modin.config import BenchmarkMode

BenchmarkMode.put(True)

# In[2]:

import modin.pandas as pd

# In[3]:

# Time loading the CSV, parsing both timestamp columns as datetimes.
# quoting=3 is the numeric value of csv.QUOTE_NONE.
get_ipython().run_line_magic('time', 'df = pd.read_csv("taxi.csv", parse_dates=["tpep_pickup_datetime", "tpep_dropoff_datetime"], quoting=3)')

# In[4]:

# Time an element-wise null check over the whole frame.
get_ipython().run_line_magic('time', 'isnull = df.isnull()')

# In[5]:

# Time applying the builtin `round` to every element of one column.
# NOTE(review): the result is named `rounded_trip_distance` but the column
# selected is "pickup_longitude"; the name is kept as-is because later cells
# may refer to it -- confirm which column was intended.
get_ipython().run_line_magic('time', 'rounded_trip_distance = df[["pickup_longitude"]].applymap(round)')

# In[ ]: