Skip to content
Permalink
main
Switch branches/tags

Name already in use

A tag already exists with the provided branch name. Many Git commands accept both tag and branch names, so creating this branch may cause unexpected behavior. Are you sure you want to create this branch?
Go to file
 
 
Cannot retrieve contributors at this time
{
"cells": [
{
"cell_type": "code",
"execution_count": 3,
"id": "9a3d1d4d-54e0-4725-933b-8337450f2df3",
"metadata": {
"id": "9a3d1d4d-54e0-4725-933b-8337450f2df3"
},
"outputs": [],
"source": [
"from datetime import datetime, timedelta\n",
"\n",
"import matplotlib.pyplot as plt\n",
"import numpy as np\n",
"import pandas as pd\n",
"import torch\n",
"import torch.nn as nn"
]
},
{
"cell_type": "markdown",
"id": "cc2e45cc-2981-4ff4-bbdd-b640b3bcbc37",
"metadata": {
"id": "cc2e45cc-2981-4ff4-bbdd-b640b3bcbc37"
},
"source": [
"## data processing"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "c421468f-c578-4583-8747-a30b5e2e8bf6",
"metadata": {
"id": "c421468f-c578-4583-8747-a30b5e2e8bf6"
},
"outputs": [],
"source": [
"!pwd"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "b298662f-dadb-451e-9ee7-8c6f2989d3b9",
"metadata": {
"id": "b298662f-dadb-451e-9ee7-8c6f2989d3b9"
},
"outputs": [],
"source": [
"# df = pd.read_csv(\"./data/scooter/E-Scooter_Trips_-_2020.csv\")"
]
},
{
"cell_type": "code",
"execution_count": 4,
"id": "8af82379",
"metadata": {},
"outputs": [],
"source": [
"# thousands=\",\" makes \"Trip Distance\" / \"Trip Duration\" (e.g. \"1,153\") load as numbers rather than strings.\n",
"df = pd.read_csv(\"./data/E-Scooter_Trips_-_2020.csv\", thousands=\",\")"
]
},
{
"cell_type": "code",
"execution_count": 5,
"id": "19665919-c190-4d8b-af25-b50998df6e20",
"metadata": {
"id": "19665919-c190-4d8b-af25-b50998df6e20"
},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>Trip ID</th>\n",
" <th>Start Time</th>\n",
" <th>End Time</th>\n",
" <th>Trip Distance</th>\n",
" <th>Trip Duration</th>\n",
" <th>Vendor</th>\n",
" <th>Start Community Area Number</th>\n",
" <th>End Community Area Number</th>\n",
" <th>Start Community Area Name</th>\n",
" <th>End Community Area Name</th>\n",
" <th>Start Centroid Latitude</th>\n",
" <th>Start Centroid Longitude</th>\n",
" <th>Start Centroid Location</th>\n",
" <th>End Centroid Latitude</th>\n",
" <th>End Centroid Longitude</th>\n",
" <th>End Centroid Location</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>3eb9a2a3-3266-4559-b1ec-e83a6f7972ab</td>\n",
" <td>08/12/2020 05:00:00 AM</td>\n",
" <td>08/12/2020 05:00:00 AM</td>\n",
" <td>1,153</td>\n",
" <td>1,027</td>\n",
" <td>spin</td>\n",
" <td>68.0</td>\n",
" <td>68.0</td>\n",
" <td>ENGLEWOOD</td>\n",
" <td>ENGLEWOOD</td>\n",
" <td>41.780068</td>\n",
" <td>-87.642266</td>\n",
" <td>POINT (-87.64226608 41.78006847)</td>\n",
" <td>41.780068</td>\n",
" <td>-87.642266</td>\n",
" <td>POINT (-87.64226608 41.78006847)</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>82dd7b8f-8de0-4f25-829b-b32bf47e8419</td>\n",
" <td>08/12/2020 05:00:00 AM</td>\n",
" <td>08/12/2020 05:00:00 AM</td>\n",
" <td>17</td>\n",
" <td>91</td>\n",
" <td>spin</td>\n",
" <td>22.0</td>\n",
" <td>21.0</td>\n",
" <td>LOGAN SQUARE</td>\n",
" <td>AVONDALE</td>\n",
" <td>41.922903</td>\n",
" <td>-87.704301</td>\n",
" <td>POINT (-87.70430082 41.92290349)</td>\n",
" <td>41.939283</td>\n",
" <td>-87.710757</td>\n",
" <td>POINT (-87.71075685 41.93928256)</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" Trip ID Start Time \\\n",
"0 3eb9a2a3-3266-4559-b1ec-e83a6f7972ab 08/12/2020 05:00:00 AM \n",
"1 82dd7b8f-8de0-4f25-829b-b32bf47e8419 08/12/2020 05:00:00 AM \n",
"\n",
" End Time Trip Distance Trip Duration Vendor \\\n",
"0 08/12/2020 05:00:00 AM 1,153 1,027 spin \n",
"1 08/12/2020 05:00:00 AM 17 91 spin \n",
"\n",
" Start Community Area Number End Community Area Number \\\n",
"0 68.0 68.0 \n",
"1 22.0 21.0 \n",
"\n",
" Start Community Area Name End Community Area Name Start Centroid Latitude \\\n",
"0 ENGLEWOOD ENGLEWOOD 41.780068 \n",
"1 LOGAN SQUARE AVONDALE 41.922903 \n",
"\n",
" Start Centroid Longitude Start Centroid Location \\\n",
"0 -87.642266 POINT (-87.64226608 41.78006847) \n",
"1 -87.704301 POINT (-87.70430082 41.92290349) \n",
"\n",
" End Centroid Latitude End Centroid Longitude \\\n",
"0 41.780068 -87.642266 \n",
"1 41.939283 -87.710757 \n",
"\n",
" End Centroid Location \n",
"0 POINT (-87.64226608 41.78006847) \n",
"1 POINT (-87.71075685 41.93928256) "
]
},
"execution_count": 5,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"df.head(2)"
]
},
{
"cell_type": "code",
"execution_count": 6,
"id": "3f056dce-a831-45de-8248-7e02fd953a7d",
"metadata": {
"id": "3f056dce-a831-45de-8248-7e02fd953a7d"
},
"outputs": [],
"source": [
"df = df.dropna()"
]
},
{
"cell_type": "code",
"execution_count": 7,
"id": "e90ac011-2b64-4d37-9ac8-aa1385fd3122",
"metadata": {
"id": "e90ac011-2b64-4d37-9ac8-aa1385fd3122"
},
"outputs": [],
"source": [
"df = df.astype({\"Start Community Area Number\": int, \"End Community Area Number\": int})"
]
},
{
"cell_type": "code",
"execution_count": 10,
"id": "f97344e1-77e2-4319-8ee1-183e735702da",
"metadata": {
"id": "f97344e1-77e2-4319-8ee1-183e735702da"
},
"outputs": [],
"source": [
"# Union of both columns: `a or b` would return only the start-side set whenever it is non-empty,\n",
"# silently dropping any area that appears solely as a trip destination.\n",
"communities = set(df[\"Start Community Area Number\"].unique()) | set(df[\"End Community Area Number\"].unique())"
]
},
{
"cell_type": "code",
"execution_count": 11,
"id": "c403e385-1f00-4dbc-a867-25d2e11b07d5",
"metadata": {
"id": "c403e385-1f00-4dbc-a867-25d2e11b07d5"
},
"outputs": [
{
"data": {
"text/plain": [
"77"
]
},
"execution_count": 11,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"len(communities)"
]
},
{
"cell_type": "code",
"execution_count": 12,
"id": "f38f6c51-859e-4a55-b6a5-20e68b18252a",
"metadata": {
"id": "f38f6c51-859e-4a55-b6a5-20e68b18252a"
},
"outputs": [],
"source": [
"# Explicit month-first, 12-hour format (e.g. \"08/12/2020 05:00:00 AM\") instead of relying on inference.\n",
"df[\"Start Time\"] = pd.to_datetime(df[\"Start Time\"], format=\"%m/%d/%Y %I:%M:%S %p\")"
]
},
{
"cell_type": "code",
"execution_count": 13,
"id": "b0b94d62-a159-4b8c-98eb-a11b4ff4adcc",
"metadata": {
"id": "b0b94d62-a159-4b8c-98eb-a11b4ff4adcc"
},
"outputs": [],
"source": [
"# Explicit month-first, 12-hour format (e.g. \"08/12/2020 05:00:00 AM\") instead of relying on inference.\n",
"df[\"End Time\"] = pd.to_datetime(df[\"End Time\"], format=\"%m/%d/%Y %I:%M:%S %p\")"
]
},
{
"cell_type": "code",
"execution_count": 14,
"id": "f960381b-e875-4d8e-bcf8-60f786128e28",
"metadata": {
"id": "f960381b-e875-4d8e-bcf8-60f786128e28",
"scrolled": true
},
"outputs": [
{
"data": {
"text/plain": [
"Trip ID object\n",
"Start Time datetime64[ns]\n",
"End Time datetime64[ns]\n",
"Trip Distance object\n",
"Trip Duration object\n",
"Vendor object\n",
"Start Community Area Number int32\n",
"End Community Area Number int32\n",
"Start Community Area Name object\n",
"End Community Area Name object\n",
"Start Centroid Latitude float64\n",
"Start Centroid Longitude float64\n",
"Start Centroid Location object\n",
"End Centroid Latitude float64\n",
"End Centroid Longitude float64\n",
"End Centroid Location object\n",
"dtype: object"
]
},
"execution_count": 14,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"df.dtypes"
]
},
{
"cell_type": "code",
"execution_count": 15,
"id": "dde242e4-6720-40b4-9ddc-6f54d93cbb20",
"metadata": {
"id": "dde242e4-6720-40b4-9ddc-6f54d93cbb20"
},
"outputs": [
{
"data": {
"text/plain": [
"(Timestamp('2020-08-12 05:00:00'),\n",
" Timestamp('2020-12-12 21:00:00'),\n",
" Timestamp('2020-08-12 05:00:00'),\n",
" Timestamp('2020-12-12 22:00:00'))"
]
},
"execution_count": 15,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"df[\"Start Time\"].min(), df[\"Start Time\"].max(), df[\"End Time\"].min(), df[\"End Time\"].max()"
]
},
{
"cell_type": "code",
"execution_count": 16,
"id": "e11d210a-d174-4529-925a-29ddc86bb9d6",
"metadata": {
"id": "e11d210a-d174-4529-925a-29ddc86bb9d6"
},
"outputs": [],
"source": [
"# Sort before enumerating so every community area number always receives the same grid index;\n",
"# iterating a set directly gives no ordering guarantee.\n",
"community_map = {area: idx for idx, area in enumerate(sorted(communities))}"
]
},
{
"cell_type": "code",
"execution_count": 17,
"id": "f782954d-48ec-4c09-a3cb-2b2927cc0c98",
"metadata": {
"id": "f782954d-48ec-4c09-a3cb-2b2927cc0c98"
},
"outputs": [],
"source": [
"# Midnight on the first and last calendar day covered by the trip timestamps.\n",
"start = datetime(2020, 8, 12)\n",
"end = datetime(2020, 12, 12)"
]
},
{
"cell_type": "code",
"execution_count": 18,
"id": "d07ede9b-7a8d-4a1e-9eaf-432d2478f22b",
"metadata": {
"id": "d07ede9b-7a8d-4a1e-9eaf-432d2478f22b"
},
"outputs": [
{
"data": {
"text/plain": [
"(datetime.datetime(2020, 8, 12, 0, 0), datetime.datetime(2020, 12, 12, 0, 0))"
]
},
"execution_count": 18,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"start, end"
]
},
{
"cell_type": "code",
"execution_count": 19,
"id": "1a9b13f8-2a1f-4eef-8503-993a753e5606",
"metadata": {
"id": "1a9b13f8-2a1f-4eef-8503-993a753e5606"
},
"outputs": [
{
"data": {
"text/plain": [
"2928.0"
]
},
"execution_count": 19,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"(end - start).total_seconds()/(60 * 60)"
]
},
{
"cell_type": "code",
"execution_count": 20,
"id": "f3dedc91-bf17-4f7a-81c2-a3d3648a4d72",
"metadata": {
"id": "f3dedc91-bf17-4f7a-81c2-a3d3648a4d72"
},
"outputs": [
{
"data": {
"text/plain": [
"2952"
]
},
"execution_count": 20,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"2928 + 24"
]
},
{
"cell_type": "code",
"execution_count": 21,
"id": "8ad49821-b152-4227-81fb-40b2687d71c8",
"metadata": {
"id": "8ad49821-b152-4227-81fb-40b2687d71c8"
},
"outputs": [],
"source": [
"# Translate community area numbers into grid indices through community_map.\n",
"df = df.assign(\n",
"    start_midx=df[\"Start Community Area Number\"].map(community_map),\n",
"    end_midx=df[\"End Community Area Number\"].map(community_map),\n",
")"
]
},
{
"cell_type": "code",
"execution_count": 22,
"id": "93d4c5cb-a009-49ab-9631-0b90dd06dad0",
"metadata": {
"id": "93d4c5cb-a009-49ab-9631-0b90dd06dad0"
},
"outputs": [],
"source": [
"# Number of trips per (Start Time, start_midx) pair, kept as a one-column frame named \"Trip ID\".\n",
"start_trips = df.groupby([\"Start Time\", \"start_midx\"])[\"Trip ID\"].count().to_frame()"
]
},
{
"cell_type": "code",
"execution_count": 23,
"id": "b543c975-204b-4c2c-acd8-75bab929da80",
"metadata": {
"id": "b543c975-204b-4c2c-acd8-75bab929da80"
},
"outputs": [],
"source": [
"# Number of trips per (End Time, end_midx) pair, kept as a one-column frame named \"Trip ID\".\n",
"end_trips = df.groupby([\"End Time\", \"end_midx\"])[\"Trip ID\"].count().to_frame()"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "f9651eea-5181-4ae5-a342-6e622076ae02",
"metadata": {
"id": "f9651eea-5181-4ae5-a342-6e622076ae02"
},
"outputs": [],
"source": [
"# Peek at the grouped counts. The earlier lookup used `trips` and `y`, which are not defined\n",
"# anywhere in this notebook and therefore raised NameError on a fresh kernel.\n",
"start_trips.head()"
]
},
{
"cell_type": "code",
"execution_count": 31,
"id": "fe68a2f9-034d-4aea-9fa8-ac147f88a1c8",
"metadata": {
"id": "fe68a2f9-034d-4aea-9fa8-ac147f88a1c8"
},
"outputs": [],
"source": [
"# Grid layout of the map and its flattened length (7 * 11 = 77 slots).\n",
"map_shape = (7, 11)\n",
"num_map_element = int(np.prod(map_shape))\n",
"in_map = np.zeros(num_map_element)\n"
]
},
{
"cell_type": "code",
"execution_count": 32,
"id": "e118c0a4-60e4-413a-8d12-39ca32f646aa",
"metadata": {
"id": "e118c0a4-60e4-413a-8d12-39ca32f646aa"
},
"outputs": [
{
"data": {
"text/plain": [
"array([[0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0.],\n",
" [0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0.],\n",
" [0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0.],\n",
" [0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0.],\n",
" [0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0.],\n",
" [0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0.],\n",
" [0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0.]])"
]
},
"execution_count": 32,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"in_map.reshape(map_shape)"
]
},
{
"cell_type": "code",
"execution_count": 33,
"id": "175845f6-2893-49f6-a7a8-4f24f17db903",
"metadata": {
"id": "175845f6-2893-49f6-a7a8-4f24f17db903"
},
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
"C:\\Users\\yy\\AppData\\Local\\Temp\\ipykernel_39464\\2680085065.py:14: FutureWarning: Series.__getitem__ treating keys as positions is deprecated. In a future version, integer keys will always be treated as labels (consistent with DataFrame behavior). To access a value by position, use `ser.iloc[pos]`\n",
" check_in_map[j] = start_trips.loc[(time, j)][0]\n",
"C:\\Users\\yy\\AppData\\Local\\Temp\\ipykernel_39464\\2680085065.py:19: FutureWarning: Series.__getitem__ treating keys as positions is deprecated. In a future version, integer keys will always be treated as labels (consistent with DataFrame behavior). To access a value by position, use `ser.iloc[pos]`\n",
" check_out_map[j] = end_trips.loc[(time, j)][0]\n"
]
}
],
"source": [
"# Build one (check-in, check-out) pair of grids per hourly slot.\n",
"# Slots run from `start` through the end of the last day: `end` is midnight, hence the extra 24 hours.\n",
"num_hours = int((end - start).total_seconds() // 3600) + 24\n",
"\n",
"timeslots = []\n",
"time_clips = []\n",
"\n",
"for i in range(num_hours):\n",
"    time = start + timedelta(hours=i)\n",
"    timeslots.append(time)\n",
"    check_in_map = np.zeros(num_map_element)\n",
"    check_out_map = np.zeros(num_map_element)\n",
"    for j in range(num_map_element):\n",
"        # Query the two tables independently: a missing start count must not skip the end count.\n",
"        for grid, trips in ((check_in_map, start_trips), (check_out_map, end_trips)):\n",
"            try:\n",
"                # .iloc[0] reads the single count column by position (plain [0] is deprecated).\n",
"                grid[j] = trips.loc[(time, j)].iloc[0]\n",
"            except KeyError:\n",
"                pass  # no trips recorded for this (time, index) pair: keep the zero\n",
"\n",
"    check_in_map = check_in_map.reshape(map_shape)\n",
"    check_out_map = check_out_map.reshape(map_shape)\n",
"\n",
"    time_clips.append((check_in_map, check_out_map))"
]
},
{
"cell_type": "code",
"execution_count": 34,
"id": "fac14eaa-6b8a-404c-a3a7-6d2342836646",
"metadata": {
"id": "fac14eaa-6b8a-404c-a3a7-6d2342836646"
},
"outputs": [
{
"data": {
"text/plain": [
"datetime.datetime(2020, 12, 12, 23, 0)"
]
},
"execution_count": 34,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"timeslots[-1]"
]
},
{
"cell_type": "code",
"execution_count": 35,
"id": "1cc1205f-8246-425e-9435-0b9011cca921",
"metadata": {
"id": "1cc1205f-8246-425e-9435-0b9011cca921"
},
"outputs": [],
"source": [
"data = np.array(time_clips)"
]
},
{
"cell_type": "code",
"execution_count": 36,
"id": "35867474-d779-4eaa-b0ad-864bb2a41e65",
"metadata": {
"id": "35867474-d779-4eaa-b0ad-864bb2a41e65"
},
"outputs": [
{
"data": {
"text/plain": [
"(2952, 2, 7, 11)"
]
},
"execution_count": 36,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"data.shape"
]
},
{
"cell_type": "code",
"execution_count": 37,
"id": "74442b4c-ed9a-4baa-8bb6-6b2527ff08fc",
"metadata": {
"id": "74442b4c-ed9a-4baa-8bb6-6b2527ff08fc"
},
"outputs": [],
"source": [
"np.save(\"./scooter_data\", data)"
]
},
{
"cell_type": "code",
"execution_count": 40,
"id": "44960cb7-8949-4df2-99a5-d00865e94004",
"metadata": {
"id": "44960cb7-8949-4df2-99a5-d00865e94004"
},
"outputs": [
{
"data": {
"text/plain": [
"(2952, 2, 7, 11)"
]
},
"execution_count": 40,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"data = np.load(\"./scooter_data.npy\")\n",
"data.shape"
]
},
{
"cell_type": "code",
"execution_count": 55,
"id": "931b1817",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"[<matplotlib.lines.Line2D at 0x1a4cd32a0e0>]"
]
},
"execution_count": 55,
"metadata": {},
"output_type": "execute_result"
},
{
"data": {
"image/png": "",
"text/plain": [
"<Figure size 640x480 with 1 Axes>"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"\n",
"# Channel 1 holds the counts built from end_trips; look at grid cell (0, 2) over the first 100 hourly slots.\n",
"test_data = data[:100, 1, 0, 2]\n",
"\n",
"fig, ax = plt.subplots()\n",
"ax.plot(test_data)\n",
"# Trailing semicolon suppresses the repr of the returned artists.\n",
"ax.set(title=\"Trips ended in grid cell (0, 2)\", xlabel=\"Hourly slot index\", ylabel=\"Trips ended\");"
]
},
{
"cell_type": "code",
"execution_count": 56,
"id": "cf9e6d94",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>Trip ID</th>\n",
" <th>Start Time</th>\n",
" <th>End Time</th>\n",
" <th>Trip Distance</th>\n",
" <th>Trip Duration</th>\n",
" <th>Vendor</th>\n",
" <th>Start Community Area Number</th>\n",
" <th>End Community Area Number</th>\n",
" <th>Start Community Area Name</th>\n",
" <th>End Community Area Name</th>\n",
" <th>Start Centroid Latitude</th>\n",
" <th>Start Centroid Longitude</th>\n",
" <th>Start Centroid Location</th>\n",
" <th>End Centroid Latitude</th>\n",
" <th>End Centroid Longitude</th>\n",
" <th>End Centroid Location</th>\n",
" <th>start_midx</th>\n",
" <th>end_midx</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>3eb9a2a3-3266-4559-b1ec-e83a6f7972ab</td>\n",
" <td>2020-08-12 05:00:00</td>\n",
" <td>2020-08-12 05:00:00</td>\n",
" <td>1,153</td>\n",
" <td>1,027</td>\n",
" <td>spin</td>\n",
" <td>68</td>\n",
" <td>68</td>\n",
" <td>ENGLEWOOD</td>\n",
" <td>ENGLEWOOD</td>\n",
" <td>41.780068</td>\n",
" <td>-87.642266</td>\n",
" <td>POINT (-87.64226608 41.78006847)</td>\n",
" <td>41.780068</td>\n",
" <td>-87.642266</td>\n",
" <td>POINT (-87.64226608 41.78006847)</td>\n",
" <td>67</td>\n",
" <td>67</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>82dd7b8f-8de0-4f25-829b-b32bf47e8419</td>\n",
" <td>2020-08-12 05:00:00</td>\n",
" <td>2020-08-12 05:00:00</td>\n",
" <td>17</td>\n",
" <td>91</td>\n",
" <td>spin</td>\n",
" <td>22</td>\n",
" <td>21</td>\n",
" <td>LOGAN SQUARE</td>\n",
" <td>AVONDALE</td>\n",
" <td>41.922903</td>\n",
" <td>-87.704301</td>\n",
" <td>POINT (-87.70430082 41.92290349)</td>\n",
" <td>41.939283</td>\n",
" <td>-87.710757</td>\n",
" <td>POINT (-87.71075685 41.93928256)</td>\n",
" <td>21</td>\n",
" <td>20</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>9120cbf3-f749-49b6-b894-0e6e065cd731</td>\n",
" <td>2020-08-12 05:00:00</td>\n",
" <td>2020-08-12 05:00:00</td>\n",
" <td>2,883</td>\n",
" <td>724</td>\n",
" <td>spin</td>\n",
" <td>3</td>\n",
" <td>6</td>\n",
" <td>UPTOWN</td>\n",
" <td>LAKE VIEW</td>\n",
" <td>41.965435</td>\n",
" <td>-87.655145</td>\n",
" <td>POINT (-87.65514456 41.96543532)</td>\n",
" <td>41.943514</td>\n",
" <td>-87.657498</td>\n",
" <td>POINT (-87.65749768 41.9435138)</td>\n",
" <td>2</td>\n",
" <td>5</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>cf2e4abc-2649-49be-924b-468a1aefc4c8</td>\n",
" <td>2020-08-12 05:00:00</td>\n",
" <td>2020-08-12 05:00:00</td>\n",
" <td>5</td>\n",
" <td>21</td>\n",
" <td>spin</td>\n",
" <td>31</td>\n",
" <td>31</td>\n",
" <td>LOWER WEST SIDE</td>\n",
" <td>LOWER WEST SIDE</td>\n",
" <td>41.848335</td>\n",
" <td>-87.675179</td>\n",
" <td>POINT (-87.67517932 41.84833501)</td>\n",
" <td>41.848335</td>\n",
" <td>-87.675179</td>\n",
" <td>POINT (-87.67517932 41.84833501)</td>\n",
" <td>30</td>\n",
" <td>30</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>0448afb5-ab64-4090-b528-e3050e7eb0f2</td>\n",
" <td>2020-08-12 07:00:00</td>\n",
" <td>2020-08-12 07:00:00</td>\n",
" <td>1,179</td>\n",
" <td>245</td>\n",
" <td>spin</td>\n",
" <td>6</td>\n",
" <td>6</td>\n",
" <td>LAKE VIEW</td>\n",
" <td>LAKE VIEW</td>\n",
" <td>41.943514</td>\n",
" <td>-87.657498</td>\n",
" <td>POINT (-87.65749768 41.9435138)</td>\n",
" <td>41.943514</td>\n",
" <td>-87.657498</td>\n",
" <td>POINT (-87.65749768 41.9435138)</td>\n",
" <td>5</td>\n",
" <td>5</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>630811</th>\n",
" <td>2c648499-436a-4244-bf2b-ce0041ee4129</td>\n",
" <td>2020-12-12 21:00:00</td>\n",
" <td>2020-12-12 22:00:00</td>\n",
" <td>4,226</td>\n",
" <td>1,327</td>\n",
" <td>lime</td>\n",
" <td>11</td>\n",
" <td>11</td>\n",
" <td>JEFFERSON PARK</td>\n",
" <td>JEFFERSON PARK</td>\n",
" <td>41.978727</td>\n",
" <td>-87.768147</td>\n",
" <td>POINT (-87.76814656 41.97872681)</td>\n",
" <td>41.978727</td>\n",
" <td>-87.768147</td>\n",
" <td>POINT (-87.76814656 41.97872681)</td>\n",
" <td>10</td>\n",
" <td>10</td>\n",
" </tr>\n",
" <tr>\n",
" <th>630812</th>\n",
" <td>72119cd3-18db-4a08-8da7-1639a6894a18</td>\n",
" <td>2020-12-12 21:00:00</td>\n",
" <td>2020-12-12 21:00:00</td>\n",
" <td>1,822</td>\n",
" <td>211</td>\n",
" <td>spin</td>\n",
" <td>3</td>\n",
" <td>3</td>\n",
" <td>UPTOWN</td>\n",
" <td>UPTOWN</td>\n",
" <td>41.965435</td>\n",
" <td>-87.655145</td>\n",
" <td>POINT (-87.65514456 41.96543532)</td>\n",
" <td>41.965435</td>\n",
" <td>-87.655145</td>\n",
" <td>POINT (-87.65514456 41.96543532)</td>\n",
" <td>2</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>630813</th>\n",
" <td>1e01298b-75e3-4a22-b440-388b093f7202</td>\n",
" <td>2020-12-12 21:00:00</td>\n",
" <td>2020-12-12 22:00:00</td>\n",
" <td>878</td>\n",
" <td>325</td>\n",
" <td>lime</td>\n",
" <td>28</td>\n",
" <td>24</td>\n",
" <td>NEAR WEST SIDE</td>\n",
" <td>WEST TOWN</td>\n",
" <td>41.874254</td>\n",
" <td>-87.664619</td>\n",
" <td>POINT (-87.66461906 41.87425419)</td>\n",
" <td>41.901459</td>\n",
" <td>-87.675568</td>\n",
" <td>POINT (-87.67556756 41.90145875)</td>\n",
" <td>27</td>\n",
" <td>23</td>\n",
" </tr>\n",
" <tr>\n",
" <th>630814</th>\n",
" <td>cce935b2-3dc8-4e06-b913-a1fd37c652d0</td>\n",
" <td>2020-12-12 21:00:00</td>\n",
" <td>2020-12-12 22:00:00</td>\n",
" <td>294</td>\n",
" <td>1,332</td>\n",
" <td>bird</td>\n",
" <td>7</td>\n",
" <td>7</td>\n",
" <td>LINCOLN PARK</td>\n",
" <td>LINCOLN PARK</td>\n",
" <td>41.921880</td>\n",
" <td>-87.645647</td>\n",
" <td>POINT (-87.64564651 41.92188043)</td>\n",
" <td>41.921880</td>\n",
" <td>-87.645647</td>\n",
" <td>POINT (-87.64564651 41.92188043)</td>\n",
" <td>6</td>\n",
" <td>6</td>\n",
" </tr>\n",
" <tr>\n",
" <th>630815</th>\n",
" <td>758cd2bd-45da-4c2c-b73a-8a07de69bd22</td>\n",
" <td>2020-12-12 21:00:00</td>\n",
" <td>2020-12-12 22:00:00</td>\n",
" <td>5,403</td>\n",
" <td>2,341</td>\n",
" <td>spin</td>\n",
" <td>6</td>\n",
" <td>6</td>\n",
" <td>LAKE VIEW</td>\n",
" <td>LAKE VIEW</td>\n",
" <td>41.943514</td>\n",
" <td>-87.657498</td>\n",
" <td>POINT (-87.65749768 41.9435138)</td>\n",
" <td>41.943514</td>\n",
" <td>-87.657498</td>\n",
" <td>POINT (-87.65749768 41.9435138)</td>\n",
" <td>5</td>\n",
" <td>5</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>629175 rows × 18 columns</p>\n",
"</div>"
],
"text/plain": [
" Trip ID Start Time \\\n",
"0 3eb9a2a3-3266-4559-b1ec-e83a6f7972ab 2020-08-12 05:00:00 \n",
"1 82dd7b8f-8de0-4f25-829b-b32bf47e8419 2020-08-12 05:00:00 \n",
"2 9120cbf3-f749-49b6-b894-0e6e065cd731 2020-08-12 05:00:00 \n",
"3 cf2e4abc-2649-49be-924b-468a1aefc4c8 2020-08-12 05:00:00 \n",
"4 0448afb5-ab64-4090-b528-e3050e7eb0f2 2020-08-12 07:00:00 \n",
"... ... ... \n",
"630811 2c648499-436a-4244-bf2b-ce0041ee4129 2020-12-12 21:00:00 \n",
"630812 72119cd3-18db-4a08-8da7-1639a6894a18 2020-12-12 21:00:00 \n",
"630813 1e01298b-75e3-4a22-b440-388b093f7202 2020-12-12 21:00:00 \n",
"630814 cce935b2-3dc8-4e06-b913-a1fd37c652d0 2020-12-12 21:00:00 \n",
"630815 758cd2bd-45da-4c2c-b73a-8a07de69bd22 2020-12-12 21:00:00 \n",
"\n",
" End Time Trip Distance Trip Duration Vendor \\\n",
"0 2020-08-12 05:00:00 1,153 1,027 spin \n",
"1 2020-08-12 05:00:00 17 91 spin \n",
"2 2020-08-12 05:00:00 2,883 724 spin \n",
"3 2020-08-12 05:00:00 5 21 spin \n",
"4 2020-08-12 07:00:00 1,179 245 spin \n",
"... ... ... ... ... \n",
"630811 2020-12-12 22:00:00 4,226 1,327 lime \n",
"630812 2020-12-12 21:00:00 1,822 211 spin \n",
"630813 2020-12-12 22:00:00 878 325 lime \n",
"630814 2020-12-12 22:00:00 294 1,332 bird \n",
"630815 2020-12-12 22:00:00 5,403 2,341 spin \n",
"\n",
" Start Community Area Number End Community Area Number \\\n",
"0 68 68 \n",
"1 22 21 \n",
"2 3 6 \n",
"3 31 31 \n",
"4 6 6 \n",
"... ... ... \n",
"630811 11 11 \n",
"630812 3 3 \n",
"630813 28 24 \n",
"630814 7 7 \n",
"630815 6 6 \n",
"\n",
" Start Community Area Name End Community Area Name \\\n",
"0 ENGLEWOOD ENGLEWOOD \n",
"1 LOGAN SQUARE AVONDALE \n",
"2 UPTOWN LAKE VIEW \n",
"3 LOWER WEST SIDE LOWER WEST SIDE \n",
"4 LAKE VIEW LAKE VIEW \n",
"... ... ... \n",
"630811 JEFFERSON PARK JEFFERSON PARK \n",
"630812 UPTOWN UPTOWN \n",
"630813 NEAR WEST SIDE WEST TOWN \n",
"630814 LINCOLN PARK LINCOLN PARK \n",
"630815 LAKE VIEW LAKE VIEW \n",
"\n",
" Start Centroid Latitude Start Centroid Longitude \\\n",
"0 41.780068 -87.642266 \n",
"1 41.922903 -87.704301 \n",
"2 41.965435 -87.655145 \n",
"3 41.848335 -87.675179 \n",
"4 41.943514 -87.657498 \n",
"... ... ... \n",
"630811 41.978727 -87.768147 \n",
"630812 41.965435 -87.655145 \n",
"630813 41.874254 -87.664619 \n",
"630814 41.921880 -87.645647 \n",
"630815 41.943514 -87.657498 \n",
"\n",
" Start Centroid Location End Centroid Latitude \\\n",
"0 POINT (-87.64226608 41.78006847) 41.780068 \n",
"1 POINT (-87.70430082 41.92290349) 41.939283 \n",
"2 POINT (-87.65514456 41.96543532) 41.943514 \n",
"3 POINT (-87.67517932 41.84833501) 41.848335 \n",
"4 POINT (-87.65749768 41.9435138) 41.943514 \n",
"... ... ... \n",
"630811 POINT (-87.76814656 41.97872681) 41.978727 \n",
"630812 POINT (-87.65514456 41.96543532) 41.965435 \n",
"630813 POINT (-87.66461906 41.87425419) 41.901459 \n",
"630814 POINT (-87.64564651 41.92188043) 41.921880 \n",
"630815 POINT (-87.65749768 41.9435138) 41.943514 \n",
"\n",
" End Centroid Longitude End Centroid Location start_midx \\\n",
"0 -87.642266 POINT (-87.64226608 41.78006847) 67 \n",
"1 -87.710757 POINT (-87.71075685 41.93928256) 21 \n",
"2 -87.657498 POINT (-87.65749768 41.9435138) 2 \n",
"3 -87.675179 POINT (-87.67517932 41.84833501) 30 \n",
"4 -87.657498 POINT (-87.65749768 41.9435138) 5 \n",
"... ... ... ... \n",
"630811 -87.768147 POINT (-87.76814656 41.97872681) 10 \n",
"630812 -87.655145 POINT (-87.65514456 41.96543532) 2 \n",
"630813 -87.675568 POINT (-87.67556756 41.90145875) 27 \n",
"630814 -87.645647 POINT (-87.64564651 41.92188043) 6 \n",
"630815 -87.657498 POINT (-87.65749768 41.9435138) 5 \n",
"\n",
" end_midx \n",
"0 67 \n",
"1 20 \n",
"2 5 \n",
"3 30 \n",
"4 5 \n",
"... ... \n",
"630811 10 \n",
"630812 2 \n",
"630813 23 \n",
"630814 6 \n",
"630815 5 \n",
"\n",
"[629175 rows x 18 columns]"
]
},
"execution_count": 56,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"df"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "1282a1e9",
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"colab": {
"provenance": []
},
"kernelspec": {
"display_name": "py310",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.10.13"
}
},
"nbformat": 4,
"nbformat_minor": 5
}