%matplotlib inline
# Dependencies and Setup
import matplotlib.pyplot as plt
import pandas as pd
import numpy as np

# Input CSV locations, relative to the working directory (change as needed).
city_data_to_load = "data/city_data.csv"
ride_data_to_load = "data/ride_data.csv"

# Load the city table (dfa) and the ride table (dfb).
dfa = pd.read_csv(city_data_to_load)
dfb = pd.read_csv(ride_data_to_load)

# Left-join the city table onto every ride row. The join key is spelled out so
# that any other column the two files might share can never silently become
# part of the key (pd.merge defaults to joining on *all* common columns).
# NOTE(review): assumes 'city' is the only column common to both files, which
# matches the un-suffixed columns in the displayed head() -- confirm.
dfc = pd.merge(dfb, dfa, how='left', on='city')
dfc.head()

## Bubble Plot of Ride Sharing Data

# Group the merged ride rows by city type, then city. Every metric below is a
# Series with a (type, city) MultiIndex, so `.loc[<type>]` yields the per-city
# values for one city type.
dfc_grouped = dfc.groupby(['type', 'city'])

# Number of rides recorded per city (x axis).
ride_counts = dfc_grouped['ride_id'].count()
just_urban_ride_counts = ride_counts.loc['Urban']
just_suburban_ride_counts = ride_counts.loc['Suburban']
just_rural_ride_counts = ride_counts.loc['Rural']

# Mean fare per city (y axis).
average_fares = dfc_grouped['fare'].mean()
just_urban_fares = average_fares.loc['Urban']
just_suburban_fares = average_fares.loc['Suburban']
just_rural_fares = average_fares.loc['Rural']

# Mean of driver_count over each city's ride rows (bubble size).
# NOTE(review): presumably driver_count is constant within a city, making this
# simply the city's driver count -- confirm against city_data.csv.
drivers_counts = dfc_grouped['driver_count'].mean()
just_urban_drivers_counts = drivers_counts.loc['Urban']
just_suburban_drivers_counts = drivers_counts.loc['Suburban']
just_rural_drivers_counts = drivers_counts.loc['Rural']

# One scatter series per city type: (x, y, driver counts, colour, legend label).
bubble_series = [
    (just_urban_ride_counts, just_urban_fares, just_urban_drivers_counts, 'orange', 'Urban'),
    (just_suburban_ride_counts, just_suburban_fares, just_suburban_drivers_counts, 'blue', 'Suburban'),
    (just_rural_ride_counts, just_rural_fares, just_rural_drivers_counts, 'gold', 'Rural'),
]
for rides, fares, drivers, colour, city_type in bubble_series:
    # The label is attached to the artist itself so the legend cannot drift out
    # of step with the plotting order.
    plt.scatter(rides, fares, s=drivers * 10, c=colour, alpha=0.8,
                edgecolors='black', label=city_type)

plt.legend(loc='upper right', title='City Types')
plt.title('Pyber Ride Sharing Data (2016)')
plt.ylabel('Average Fare ($)')
plt.xlabel('Total Number of Rides (Per City)')
plt.grid(True)

plt.savefig("../Images/Ride.png")

## Total Fares by City Type

# Total fare for each (type, city) group.
total_fares = dfc_grouped['fare'].sum()

# Collapse the per-city totals to one figure per city type.
just_urban_fares_sum = total_fares.loc['Urban'].sum()
just_suburban_fares_sum = total_fares.loc['Suburban'].sum()
just_rural_fares_sum = total_fares.loc['Rural'].sum()

# Wedge order here must match `explode1`, `labels` and `colors` below.
fares_sum_list = [just_urban_fares_sum, just_rural_fares_sum, just_suburban_fares_sum]
explode1 = [0.1, 0, 0]  # offsets the first (Urban) wedge
labels = ['Urban', 'Rural', 'Suburban']
colors = ['#f28383', '#f6cf05', '#84cbfb']


plt.axis('equal')
plt.pie(fares_sum_list, explode = explode1, labels = labels, colors = colors, autopct="%1.1f%%", shadow = True, startangle = 290)
plt.title('% of Total Fares by City Type')

# Save BEFORE showing: once plt.show() has displayed the figure it is no longer
# the current figure, so a later savefig() writes a fresh, empty canvas.
plt.savefig("../Images/FaresSumPie.png")
plt.show()

<Figure size 432x288 with 0 Axes>

## Total Rides by City Type

# Sum the per-city ride counts to get one ride total per city type.
just_urban_ride_counts_sum = ride_counts.loc['Urban'].sum()
just_suburban_ride_counts_sum = ride_counts.loc['Suburban'].sum()
just_rural_ride_counts_sum = ride_counts.loc['Rural'].sum()

# Wedge order here must match `explode1`, `labels` and `colors` below.
sum_counts_list = [just_urban_ride_counts_sum, just_rural_ride_counts_sum, just_suburban_ride_counts_sum]
explode1 = [0.1, 0, 0]  # offsets the first (Urban) wedge
labels = ['Urban', 'Rural', 'Suburban']
colors = ['#f28383', '#f6cf05', '#84cbfb']


plt.axis('equal')
plt.pie(sum_counts_list, explode = explode1, labels = labels, colors = colors, autopct="%1.1f%%", shadow = True, startangle = 260)
plt.title('% of Total Rides by City Type')

# Save BEFORE showing: once plt.show() has displayed the figure it is no longer
# the current figure, so a later savefig() writes a fresh, empty canvas.
plt.savefig("../Images/RideCountPie.png")
plt.show()

<Figure size 432x288 with 0 Axes>

## Total Drivers by City Type

# `drivers_counts` holds one driver figure per (type, city); summing within a
# city type gives that type's driver total.
just_urban_drivers_counts_sum = drivers_counts.loc['Urban'].sum()
just_suburban_drivers_counts_sum = drivers_counts.loc['Suburban'].sum()
just_rural_drivers_counts_sum = drivers_counts.loc['Rural'].sum()

# Wedge order here must match `explode1`, `labels` and `colors` below.
drivers_sum_list = [just_urban_drivers_counts_sum, just_rural_drivers_counts_sum, just_suburban_drivers_counts_sum]
explode1 = [0.1, 0, 0]  # offsets the first (Urban) wedge
labels = ['Urban', 'Rural', 'Suburban']
colors = ['#f28383', '#f6cf05', '#84cbfb']


plt.axis('equal')
plt.pie(drivers_sum_list, explode = explode1, labels = labels, colors = colors, autopct="%1.1f%%", shadow = True, startangle = 235)
plt.title('% of Total Drivers by City Type')

# Save BEFORE showing: once plt.show() has displayed the figure it is no longer
# the current figure, so a later savefig() writes a fresh, empty canvas.
plt.savefig("../Images/DriverCountPie.png")
plt.show()

<Figure size 432x288 with 0 Axes>

	city	date	fare	ride_id	driver_count	type
0	Lake Jonathanshire	2018-01-14 10:14:22	13.83	5739410935873	5	Urban
1	South Michelleport	2018-03-04 18:24:09	30.24	2343912425577	72	Urban
2	Port Samanthamouth	2018-02-24 04:29:00	33.44	2005065760003	57	Urban
3	Rodneyfort	2018-02-10 23:22:03	23.44	5149245426178	34	Urban
4	South Jack	2018-03-06 04:28:35	34.58	3908451377344	46	Urban

Summary

Solution

## Total Fares by City Type

## Total Rides by City Type

## Total Drivers by City Type