Cyclist Capstone Project
Data comparing casual and member bike riders in Chicago from 11/2021 - 10/2022
@kaggle.nixonthao_cyclist_capstone_project
Data comparing casual and member bike riders in Chicago from 11/2021 - 10/2022
@kaggle.nixonthao_cyclist_capstone_project
Here are 12 months of data on the Divvy bicycle-sharing service in Chicago. The monthly files were combined into a single data frame. The combined data was then cleaned, organized, sorted, and filtered to find key takeaways on how to increase rental memberships.
Data is from November 2021 - October 2022
There are 13 columns:
RIDE_ID
RIDEABLE_TYPE
STARTED_AT
ENDED_AT
START_STATION_NAME
START_STATION_ID
END_STATION_NAME
END_STATION_ID
START_LAT
START_LNG
END_LAT
END_LNG
MEMBER_CASUAL
I added two columns, Ride_Length and WeekDays, in R to find more data for the business task.
Here are the files and overall markdown.
-- Trip table for April 2022 (month inferred from the table name - verify against started_at).
-- NOTE(review): n_202204_divvy_tripdata declares the same 13 columns; if it holds the same
-- month's rides, reading both tables together would double-count - TODO confirm.
CREATE TABLE apr_2022 (
    -- ride and bike descriptors
    "ride_id"            VARCHAR,
    "rideable_type"      VARCHAR,
    -- trip start / end; declared without a time zone qualifier
    "started_at"         TIMESTAMP,
    "ended_at"           TIMESTAMP,
    -- origin and destination stations
    "start_station_name" VARCHAR,
    "start_station_id"   VARCHAR,
    "end_station_name"   VARCHAR,
    "end_station_id"     VARCHAR,
    -- start / end position (presumably latitude / longitude in decimal degrees)
    "start_lat"          DOUBLE,
    "start_lng"          DOUBLE,
    "end_lat"            DOUBLE,
    "end_lng"            DOUBLE,
    -- rider category (presumably 'member' or 'casual' - TODO confirm values)
    "member_casual"      VARCHAR
);
-- Trip table for August 2022 (month inferred from the table name - verify against started_at).
-- NOTE(review): n_202208_divvy_tripdata declares the same 13 columns; if it holds the same
-- month's rides, reading both tables together would double-count - TODO confirm.
CREATE TABLE aug_2022 (
    -- ride and bike descriptors
    "ride_id"            VARCHAR,
    "rideable_type"      VARCHAR,
    -- trip start / end; declared without a time zone qualifier
    "started_at"         TIMESTAMP,
    "ended_at"           TIMESTAMP,
    -- origin and destination stations
    "start_station_name" VARCHAR,
    "start_station_id"   VARCHAR,
    "end_station_name"   VARCHAR,
    "end_station_id"     VARCHAR,
    -- start / end position (presumably latitude / longitude in decimal degrees)
    "start_lat"          DOUBLE,
    "start_lng"          DOUBLE,
    "end_lat"            DOUBLE,
    "end_lng"            DOUBLE,
    -- rider category (presumably 'member' or 'casual' - TODO confirm values)
    "member_casual"      VARCHAR
);
-- Trip table for December 2021 (month inferred from the table name - verify against started_at).
-- NOTE(review): n_202112_divvy_tripdata declares the same 13 columns; if it holds the same
-- month's rides, reading both tables together would double-count - TODO confirm.
CREATE TABLE dec_2021 (
    -- ride and bike descriptors
    "ride_id"            VARCHAR,
    "rideable_type"      VARCHAR,
    -- trip start / end; declared without a time zone qualifier
    "started_at"         TIMESTAMP,
    "ended_at"           TIMESTAMP,
    -- origin and destination stations
    "start_station_name" VARCHAR,
    "start_station_id"   VARCHAR,
    "end_station_name"   VARCHAR,
    "end_station_id"     VARCHAR,
    -- start / end position (presumably latitude / longitude in decimal degrees)
    "start_lat"          DOUBLE,
    "start_lng"          DOUBLE,
    "end_lat"            DOUBLE,
    "end_lng"            DOUBLE,
    -- rider category (presumably 'member' or 'casual' - TODO confirm values)
    "member_casual"      VARCHAR
);
-- Trip table for February 2022 (month inferred from the table name - verify against started_at).
-- NOTE(review): n_202202_divvy_tripdata declares the same 13 columns; if it holds the same
-- month's rides, reading both tables together would double-count - TODO confirm.
CREATE TABLE feb_2022 (
    -- ride and bike descriptors
    "ride_id"            VARCHAR,
    "rideable_type"      VARCHAR,
    -- trip start / end; declared without a time zone qualifier
    "started_at"         TIMESTAMP,
    "ended_at"           TIMESTAMP,
    -- origin and destination stations
    "start_station_name" VARCHAR,
    "start_station_id"   VARCHAR,
    "end_station_name"   VARCHAR,
    "end_station_id"     VARCHAR,
    -- start / end position (presumably latitude / longitude in decimal degrees)
    "start_lat"          DOUBLE,
    "start_lng"          DOUBLE,
    "end_lat"            DOUBLE,
    "end_lng"            DOUBLE,
    -- rider category (presumably 'member' or 'casual' - TODO confirm values)
    "member_casual"      VARCHAR
);
-- Trip table for January 2022 (month inferred from the table name - verify against started_at).
-- NOTE(review): n_202201_divvy_tripdata declares the same 13 columns; if it holds the same
-- month's rides, reading both tables together would double-count - TODO confirm.
CREATE TABLE jan_2022 (
    -- ride and bike descriptors
    "ride_id"            VARCHAR,
    "rideable_type"      VARCHAR,
    -- trip start / end; declared without a time zone qualifier
    "started_at"         TIMESTAMP,
    "ended_at"           TIMESTAMP,
    -- origin and destination stations
    "start_station_name" VARCHAR,
    "start_station_id"   VARCHAR,
    "end_station_name"   VARCHAR,
    "end_station_id"     VARCHAR,
    -- start / end position (presumably latitude / longitude in decimal degrees)
    "start_lat"          DOUBLE,
    "start_lng"          DOUBLE,
    "end_lat"            DOUBLE,
    "end_lng"            DOUBLE,
    -- rider category (presumably 'member' or 'casual' - TODO confirm values)
    "member_casual"      VARCHAR
);
-- Trip table for July 2022 (month inferred from the table name - verify against started_at).
-- NOTE(review): n_202207_divvy_tripdata declares the same 13 columns; if it holds the same
-- month's rides, reading both tables together would double-count - TODO confirm.
CREATE TABLE july_2022 (
    -- ride and bike descriptors
    "ride_id"            VARCHAR,
    "rideable_type"      VARCHAR,
    -- trip start / end; declared without a time zone qualifier
    "started_at"         TIMESTAMP,
    "ended_at"           TIMESTAMP,
    -- origin and destination stations
    "start_station_name" VARCHAR,
    "start_station_id"   VARCHAR,
    "end_station_name"   VARCHAR,
    "end_station_id"     VARCHAR,
    -- start / end position (presumably latitude / longitude in decimal degrees)
    "start_lat"          DOUBLE,
    "start_lng"          DOUBLE,
    "end_lat"            DOUBLE,
    "end_lng"            DOUBLE,
    -- rider category (presumably 'member' or 'casual' - TODO confirm values)
    "member_casual"      VARCHAR
);
-- Trip table for June 2022 (month inferred from the table name - verify against started_at).
-- NOTE(review): n_202206_divvy_tripdata declares the same 13 columns; if it holds the same
-- month's rides, reading both tables together would double-count - TODO confirm.
CREATE TABLE june_2022 (
    -- ride and bike descriptors
    "ride_id"            VARCHAR,
    "rideable_type"      VARCHAR,
    -- trip start / end; declared without a time zone qualifier
    "started_at"         TIMESTAMP,
    "ended_at"           TIMESTAMP,
    -- origin and destination stations
    "start_station_name" VARCHAR,
    "start_station_id"   VARCHAR,
    "end_station_name"   VARCHAR,
    "end_station_id"     VARCHAR,
    -- start / end position (presumably latitude / longitude in decimal degrees)
    "start_lat"          DOUBLE,
    "start_lng"          DOUBLE,
    "end_lat"            DOUBLE,
    "end_lng"            DOUBLE,
    -- rider category (presumably 'member' or 'casual' - TODO confirm values)
    "member_casual"      VARCHAR
);
-- Trip table for March 2022 (month inferred from the table name - verify against started_at).
-- NOTE(review): n_202203_divvy_tripdata declares the same 13 columns; if it holds the same
-- month's rides, reading both tables together would double-count - TODO confirm.
CREATE TABLE mar_2022 (
    -- ride and bike descriptors
    "ride_id"            VARCHAR,
    "rideable_type"      VARCHAR,
    -- trip start / end; declared without a time zone qualifier
    "started_at"         TIMESTAMP,
    "ended_at"           TIMESTAMP,
    -- origin and destination stations
    "start_station_name" VARCHAR,
    "start_station_id"   VARCHAR,
    "end_station_name"   VARCHAR,
    "end_station_id"     VARCHAR,
    -- start / end position (presumably latitude / longitude in decimal degrees)
    "start_lat"          DOUBLE,
    "start_lng"          DOUBLE,
    "end_lat"            DOUBLE,
    "end_lng"            DOUBLE,
    -- rider category (presumably 'member' or 'casual' - TODO confirm values)
    "member_casual"      VARCHAR
);
-- Trip table for May 2022 (month inferred from the table name - verify against started_at).
-- NOTE(review): n_202205_divvy_tripdata declares the same 13 columns; if it holds the same
-- month's rides, reading both tables together would double-count - TODO confirm.
CREATE TABLE may_2022 (
    -- ride and bike descriptors
    "ride_id"            VARCHAR,
    "rideable_type"      VARCHAR,
    -- trip start / end; declared without a time zone qualifier
    "started_at"         TIMESTAMP,
    "ended_at"           TIMESTAMP,
    -- origin and destination stations
    "start_station_name" VARCHAR,
    "start_station_id"   VARCHAR,
    "end_station_name"   VARCHAR,
    "end_station_id"     VARCHAR,
    -- start / end position (presumably latitude / longitude in decimal degrees)
    "start_lat"          DOUBLE,
    "start_lng"          DOUBLE,
    "end_lat"            DOUBLE,
    "end_lng"            DOUBLE,
    -- rider category (presumably 'member' or 'casual' - TODO confirm values)
    "member_casual"      VARCHAR
);
-- Trip table for 2021-11 (YYYYMM inferred from the table name - verify against started_at).
-- NOTE(review): nov_2021 declares the same 13 columns; if it holds the same month's rides,
-- reading both tables together would double-count - TODO confirm.
CREATE TABLE n_202111_divvy_tripdata (
    -- ride and bike descriptors
    "ride_id"            VARCHAR,
    "rideable_type"      VARCHAR,
    -- trip start / end; declared without a time zone qualifier
    "started_at"         TIMESTAMP,
    "ended_at"           TIMESTAMP,
    -- origin and destination stations
    "start_station_name" VARCHAR,
    "start_station_id"   VARCHAR,
    "end_station_name"   VARCHAR,
    "end_station_id"     VARCHAR,
    -- start / end position (presumably latitude / longitude in decimal degrees)
    "start_lat"          DOUBLE,
    "start_lng"          DOUBLE,
    "end_lat"            DOUBLE,
    "end_lng"            DOUBLE,
    -- rider category (presumably 'member' or 'casual' - TODO confirm values)
    "member_casual"      VARCHAR
);
-- Trip table for 2021-12 (YYYYMM inferred from the table name - verify against started_at).
-- NOTE(review): dec_2021 declares the same 13 columns; if it holds the same month's rides,
-- reading both tables together would double-count - TODO confirm.
CREATE TABLE n_202112_divvy_tripdata (
    -- ride and bike descriptors
    "ride_id"            VARCHAR,
    "rideable_type"      VARCHAR,
    -- trip start / end; declared without a time zone qualifier
    "started_at"         TIMESTAMP,
    "ended_at"           TIMESTAMP,
    -- origin and destination stations
    "start_station_name" VARCHAR,
    "start_station_id"   VARCHAR,
    "end_station_name"   VARCHAR,
    "end_station_id"     VARCHAR,
    -- start / end position (presumably latitude / longitude in decimal degrees)
    "start_lat"          DOUBLE,
    "start_lng"          DOUBLE,
    "end_lat"            DOUBLE,
    "end_lng"            DOUBLE,
    -- rider category (presumably 'member' or 'casual' - TODO confirm values)
    "member_casual"      VARCHAR
);
-- Trip table for 2022-01 (YYYYMM inferred from the table name - verify against started_at).
-- NOTE(review): jan_2022 declares the same 13 columns; if it holds the same month's rides,
-- reading both tables together would double-count - TODO confirm.
CREATE TABLE n_202201_divvy_tripdata (
    -- ride and bike descriptors
    "ride_id"            VARCHAR,
    "rideable_type"      VARCHAR,
    -- trip start / end; declared without a time zone qualifier
    "started_at"         TIMESTAMP,
    "ended_at"           TIMESTAMP,
    -- origin and destination stations
    "start_station_name" VARCHAR,
    "start_station_id"   VARCHAR,
    "end_station_name"   VARCHAR,
    "end_station_id"     VARCHAR,
    -- start / end position (presumably latitude / longitude in decimal degrees)
    "start_lat"          DOUBLE,
    "start_lng"          DOUBLE,
    "end_lat"            DOUBLE,
    "end_lng"            DOUBLE,
    -- rider category (presumably 'member' or 'casual' - TODO confirm values)
    "member_casual"      VARCHAR
);
-- Trip table for 2022-02 (YYYYMM inferred from the table name - verify against started_at).
-- NOTE(review): feb_2022 declares the same 13 columns; if it holds the same month's rides,
-- reading both tables together would double-count - TODO confirm.
CREATE TABLE n_202202_divvy_tripdata (
    -- ride and bike descriptors
    "ride_id"            VARCHAR,
    "rideable_type"      VARCHAR,
    -- trip start / end; declared without a time zone qualifier
    "started_at"         TIMESTAMP,
    "ended_at"           TIMESTAMP,
    -- origin and destination stations
    "start_station_name" VARCHAR,
    "start_station_id"   VARCHAR,
    "end_station_name"   VARCHAR,
    "end_station_id"     VARCHAR,
    -- start / end position (presumably latitude / longitude in decimal degrees)
    "start_lat"          DOUBLE,
    "start_lng"          DOUBLE,
    "end_lat"            DOUBLE,
    "end_lng"            DOUBLE,
    -- rider category (presumably 'member' or 'casual' - TODO confirm values)
    "member_casual"      VARCHAR
);
-- Trip table for 2022-03 (YYYYMM inferred from the table name - verify against started_at).
-- NOTE(review): mar_2022 declares the same 13 columns; if it holds the same month's rides,
-- reading both tables together would double-count - TODO confirm.
CREATE TABLE n_202203_divvy_tripdata (
    -- ride and bike descriptors
    "ride_id"            VARCHAR,
    "rideable_type"      VARCHAR,
    -- trip start / end; declared without a time zone qualifier
    "started_at"         TIMESTAMP,
    "ended_at"           TIMESTAMP,
    -- origin and destination stations
    "start_station_name" VARCHAR,
    "start_station_id"   VARCHAR,
    "end_station_name"   VARCHAR,
    "end_station_id"     VARCHAR,
    -- start / end position (presumably latitude / longitude in decimal degrees)
    "start_lat"          DOUBLE,
    "start_lng"          DOUBLE,
    "end_lat"            DOUBLE,
    "end_lng"            DOUBLE,
    -- rider category (presumably 'member' or 'casual' - TODO confirm values)
    "member_casual"      VARCHAR
);
-- Trip table for 2022-04 (YYYYMM inferred from the table name - verify against started_at).
-- NOTE(review): apr_2022 declares the same 13 columns; if it holds the same month's rides,
-- reading both tables together would double-count - TODO confirm.
CREATE TABLE n_202204_divvy_tripdata (
    -- ride and bike descriptors
    "ride_id"            VARCHAR,
    "rideable_type"      VARCHAR,
    -- trip start / end; declared without a time zone qualifier
    "started_at"         TIMESTAMP,
    "ended_at"           TIMESTAMP,
    -- origin and destination stations
    "start_station_name" VARCHAR,
    "start_station_id"   VARCHAR,
    "end_station_name"   VARCHAR,
    "end_station_id"     VARCHAR,
    -- start / end position (presumably latitude / longitude in decimal degrees)
    "start_lat"          DOUBLE,
    "start_lng"          DOUBLE,
    "end_lat"            DOUBLE,
    "end_lng"            DOUBLE,
    -- rider category (presumably 'member' or 'casual' - TODO confirm values)
    "member_casual"      VARCHAR
);
-- Trip table for 2022-05 (YYYYMM inferred from the table name - verify against started_at).
-- NOTE(review): may_2022 declares the same 13 columns; if it holds the same month's rides,
-- reading both tables together would double-count - TODO confirm.
CREATE TABLE n_202205_divvy_tripdata (
    -- ride and bike descriptors
    "ride_id"            VARCHAR,
    "rideable_type"      VARCHAR,
    -- trip start / end; declared without a time zone qualifier
    "started_at"         TIMESTAMP,
    "ended_at"           TIMESTAMP,
    -- origin and destination stations
    "start_station_name" VARCHAR,
    "start_station_id"   VARCHAR,
    "end_station_name"   VARCHAR,
    "end_station_id"     VARCHAR,
    -- start / end position (presumably latitude / longitude in decimal degrees)
    "start_lat"          DOUBLE,
    "start_lng"          DOUBLE,
    "end_lat"            DOUBLE,
    "end_lng"            DOUBLE,
    -- rider category (presumably 'member' or 'casual' - TODO confirm values)
    "member_casual"      VARCHAR
);
-- Trip table for 2022-06 (YYYYMM inferred from the table name - verify against started_at).
-- NOTE(review): june_2022 declares the same 13 columns; if it holds the same month's rides,
-- reading both tables together would double-count - TODO confirm.
CREATE TABLE n_202206_divvy_tripdata (
    -- ride and bike descriptors
    "ride_id"            VARCHAR,
    "rideable_type"      VARCHAR,
    -- trip start / end; declared without a time zone qualifier
    "started_at"         TIMESTAMP,
    "ended_at"           TIMESTAMP,
    -- origin and destination stations
    "start_station_name" VARCHAR,
    "start_station_id"   VARCHAR,
    "end_station_name"   VARCHAR,
    "end_station_id"     VARCHAR,
    -- start / end position (presumably latitude / longitude in decimal degrees)
    "start_lat"          DOUBLE,
    "start_lng"          DOUBLE,
    "end_lat"            DOUBLE,
    "end_lng"            DOUBLE,
    -- rider category (presumably 'member' or 'casual' - TODO confirm values)
    "member_casual"      VARCHAR
);
-- Trip table for 2022-07 (YYYYMM inferred from the table name - verify against started_at).
-- NOTE(review): july_2022 declares the same 13 columns; if it holds the same month's rides,
-- reading both tables together would double-count - TODO confirm.
CREATE TABLE n_202207_divvy_tripdata (
    -- ride and bike descriptors
    "ride_id"            VARCHAR,
    "rideable_type"      VARCHAR,
    -- trip start / end; declared without a time zone qualifier
    "started_at"         TIMESTAMP,
    "ended_at"           TIMESTAMP,
    -- origin and destination stations
    "start_station_name" VARCHAR,
    "start_station_id"   VARCHAR,
    "end_station_name"   VARCHAR,
    "end_station_id"     VARCHAR,
    -- start / end position (presumably latitude / longitude in decimal degrees)
    "start_lat"          DOUBLE,
    "start_lng"          DOUBLE,
    "end_lat"            DOUBLE,
    "end_lng"            DOUBLE,
    -- rider category (presumably 'member' or 'casual' - TODO confirm values)
    "member_casual"      VARCHAR
);
-- Trip table for 2022-08 (YYYYMM inferred from the table name - verify against started_at).
-- NOTE(review): aug_2022 declares the same 13 columns; if it holds the same month's rides,
-- reading both tables together would double-count - TODO confirm.
CREATE TABLE n_202208_divvy_tripdata (
    -- ride and bike descriptors
    "ride_id"            VARCHAR,
    "rideable_type"      VARCHAR,
    -- trip start / end; declared without a time zone qualifier
    "started_at"         TIMESTAMP,
    "ended_at"           TIMESTAMP,
    -- origin and destination stations
    "start_station_name" VARCHAR,
    "start_station_id"   VARCHAR,
    "end_station_name"   VARCHAR,
    "end_station_id"     VARCHAR,
    -- start / end position (presumably latitude / longitude in decimal degrees)
    "start_lat"          DOUBLE,
    "start_lng"          DOUBLE,
    "end_lat"            DOUBLE,
    "end_lng"            DOUBLE,
    -- rider category (presumably 'member' or 'casual' - TODO confirm values)
    "member_casual"      VARCHAR
);
-- Trip table for 2022-09 (YYYYMM inferred from the table name - verify against started_at).
-- Unlike its siblings, this table's name ends in "publictripdata" rather than "tripdata".
-- NOTE(review): sept_2022 declares the same 13 columns; if it holds the same month's rides,
-- reading both tables together would double-count - TODO confirm.
CREATE TABLE n_202209_divvy_publictripdata (
    -- ride and bike descriptors
    "ride_id"            VARCHAR,
    "rideable_type"      VARCHAR,
    -- trip start / end; declared without a time zone qualifier
    "started_at"         TIMESTAMP,
    "ended_at"           TIMESTAMP,
    -- origin and destination stations
    "start_station_name" VARCHAR,
    "start_station_id"   VARCHAR,
    "end_station_name"   VARCHAR,
    "end_station_id"     VARCHAR,
    -- start / end position (presumably latitude / longitude in decimal degrees)
    "start_lat"          DOUBLE,
    "start_lng"          DOUBLE,
    "end_lat"            DOUBLE,
    "end_lng"            DOUBLE,
    -- rider category (presumably 'member' or 'casual' - TODO confirm values)
    "member_casual"      VARCHAR
);
-- Trip table for 2022-10 (YYYYMM inferred from the table name - verify against started_at).
-- NOTE(review): oct_2022 declares the same 13 columns; if it holds the same month's rides,
-- reading both tables together would double-count - TODO confirm.
CREATE TABLE n_202210_divvy_tripdata (
    -- ride and bike descriptors
    "ride_id"            VARCHAR,
    "rideable_type"      VARCHAR,
    -- trip start / end; declared without a time zone qualifier
    "started_at"         TIMESTAMP,
    "ended_at"           TIMESTAMP,
    -- origin and destination stations
    "start_station_name" VARCHAR,
    "start_station_id"   VARCHAR,
    "end_station_name"   VARCHAR,
    "end_station_id"     VARCHAR,
    -- start / end position (presumably latitude / longitude in decimal degrees)
    "start_lat"          DOUBLE,
    "start_lng"          DOUBLE,
    "end_lat"            DOUBLE,
    "end_lng"            DOUBLE,
    -- rider category (presumably 'member' or 'casual' - TODO confirm values)
    "member_casual"      VARCHAR
);
-- Trip table for November 2021 (month inferred from the table name - verify against started_at).
-- NOTE(review): n_202111_divvy_tripdata declares the same 13 columns; if it holds the same
-- month's rides, reading both tables together would double-count - TODO confirm.
CREATE TABLE nov_2021 (
    -- ride and bike descriptors
    "ride_id"            VARCHAR,
    "rideable_type"      VARCHAR,
    -- trip start / end; declared without a time zone qualifier
    "started_at"         TIMESTAMP,
    "ended_at"           TIMESTAMP,
    -- origin and destination stations
    "start_station_name" VARCHAR,
    "start_station_id"   VARCHAR,
    "end_station_name"   VARCHAR,
    "end_station_id"     VARCHAR,
    -- start / end position (presumably latitude / longitude in decimal degrees)
    "start_lat"          DOUBLE,
    "start_lng"          DOUBLE,
    "end_lat"            DOUBLE,
    "end_lng"            DOUBLE,
    -- rider category (presumably 'member' or 'casual' - TODO confirm values)
    "member_casual"      VARCHAR
);
-- Trip table for October 2022 (month inferred from the table name - verify against started_at).
-- NOTE(review): n_202210_divvy_tripdata declares the same 13 columns; if it holds the same
-- month's rides, reading both tables together would double-count - TODO confirm.
CREATE TABLE oct_2022 (
    -- ride and bike descriptors
    "ride_id"            VARCHAR,
    "rideable_type"      VARCHAR,
    -- trip start / end; declared without a time zone qualifier
    "started_at"         TIMESTAMP,
    "ended_at"           TIMESTAMP,
    -- origin and destination stations
    "start_station_name" VARCHAR,
    "start_station_id"   VARCHAR,
    "end_station_name"   VARCHAR,
    "end_station_id"     VARCHAR,
    -- start / end position (presumably latitude / longitude in decimal degrees)
    "start_lat"          DOUBLE,
    "start_lng"          DOUBLE,
    "end_lat"            DOUBLE,
    "end_lng"            DOUBLE,
    -- rider category (presumably 'member' or 'casual' - TODO confirm values)
    "member_casual"      VARCHAR
);
-- Trip table for September 2022 (month inferred from the table name - verify against started_at).
-- NOTE(review): n_202209_divvy_publictripdata declares the same 13 columns; if it holds the
-- same month's rides, reading both tables together would double-count - TODO confirm.
CREATE TABLE sept_2022 (
    -- ride and bike descriptors
    "ride_id"            VARCHAR,
    "rideable_type"      VARCHAR,
    -- trip start / end; declared without a time zone qualifier
    "started_at"         TIMESTAMP,
    "ended_at"           TIMESTAMP,
    -- origin and destination stations
    "start_station_name" VARCHAR,
    "start_station_id"   VARCHAR,
    "end_station_name"   VARCHAR,
    "end_station_id"     VARCHAR,
    -- start / end position (presumably latitude / longitude in decimal degrees)
    "start_lat"          DOUBLE,
    "start_lng"          DOUBLE,
    "end_lat"            DOUBLE,
    "end_lng"            DOUBLE,
    -- rider category (presumably 'member' or 'casual' - TODO confirm values)
    "member_casual"      VARCHAR
);
Anyone who has the link will be able to view this.