Back to Modin

To run this notebook as shown in the README GIFs, you must first download the 2015 NYC Taxi Trip Data locally; the first code cell below does this.

examples/jupyter/Pandas_Taxi.ipynb

0.37.1618 B
Original Source
python
# To run this notebook as done in the README GIFs, the 2015 NYC Taxi Trip Data
# must be available locally. This cell downloads the January 2015 green-taxi
# CSV and saves it as "taxi.csv" (a relative path, so it lands in the current
# working directory).
import urllib.request
url_path = "https://modin-datasets.intel.com/green-taxi/green_tripdata_2015-01.csv"
# Fetch the file at url_path and write it to the local file "taxi.csv".
urllib.request.urlretrieve(url_path, "taxi.csv")

# Install a global "ignore" filter so warnings raised from here on are hidden.
import warnings
warnings.filterwarnings("ignore")
python
import pandas as pd
python
# Load "taxi.csv" into a DataFrame, timing the statement with IPython's %time magic.
# The two listed columns are parsed as datetimes; quoting=3 is csv.QUOTE_NONE,
# so quote characters in the file get no special treatment.
%time df = pd.read_csv("taxi.csv", parse_dates=["tpep_pickup_datetime", "tpep_dropoff_datetime"], quoting=3)
python
# Time the computation of a boolean mask marking the missing values in df.
%time isnull = df.isnull()
python
%time rounded_trip_distance = df[["pickup_longitude"]].applymap(round)