-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathPP2_Data_Analysis.sql
55 lines (47 loc) · 2.17 KB
/
PP2_Data_Analysis.sql
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
-- Data Analysis
-- bikes types used by riders
SELECT member_casual, rideable_type, COUNT(*) AS total_trips
FROM `2020_cyclistic_data.2020_cyclistic_cleaned_merged_data`
GROUP BY member_casual, rideable_type
ORDER BY member_casual, total_trips;
-- no. of trips per month
SELECT month, member_casual, COUNT(ride_id) AS no_of_trips_per_month
FROM `2020_cyclistic_data.2020_cyclistic_cleaned_merged_data`
GROUP BY month, member_casual
ORDER BY member_casual;
-- no. of trips per days of the week
SELECT day_of_week, member_casual, COUNT(ride_id) AS no_of_trips_per_day_of_week
FROM `2020_cyclistic_data.2020_cyclistic_cleaned_merged_data`
GROUP BY day_of_week, member_casual
ORDER BY member_casual;
-- no. of trips per hour
SELECT EXTRACT(HOUR FROM started_at) AS hour_of_day, member_casual, COUNT(ride_id) AS no_of_trips_per_hour
FROM `2020_cyclistic_data.2020_cyclistic_cleaned_merged_data`
GROUP BY hour_of_day, member_casual
ORDER BY member_casual;
-- average ride_length per month
SELECT month, member_casual, AVG(ride_length) AS avg_ride_duration
FROM `2020_cyclistic_data.2020_cyclistic_cleaned_merged_data`
GROUP BY month, member_casual;
-- average ride_length per day_of_week
SELECT day_of_week, member_casual, AVG(ride_length) AS avg_ride_duration
FROM `2020_cyclistic_data.2020_cyclistic_cleaned_merged_data`
GROUP BY day_of_week, member_casual
ORDER BY day_of_week;
-- average ride_length per hour
SELECT EXTRACT(HOUR FROM started_at) AS hour_of_day, member_casual, AVG(ride_length) AS avg_ride_duration
FROM `2020_cyclistic_data.2020_cyclistic_cleaned_merged_data`
GROUP BY hour_of_day, member_casual
ORDER BY member_casual;
-- starting station locations
SELECT start_station_name, member_casual,
AVG(start_lat) AS start_lat, AVG(start_lng) AS start_lng,
COUNT(ride_id) AS total_trips
FROM `2020_cyclistic_data.2020_cyclistic_cleaned_merged_data`
GROUP BY start_station_name, member_casual;
-- ending station locations
SELECT end_station_name, member_casual,
AVG(end_lat) AS end_lat, AVG(end_lng) AS end_lng,
COUNT(ride_id) AS total_trips
FROM `2020_cyclistic_data.2020_cyclistic_cleaned_merged_data`
GROUP BY end_station_name, member_casual;