Skip to content

Commit

Permalink
write rejections to csv
Browse files Browse the repository at this point in the history
  • Loading branch information
simei94 committed Nov 11, 2024
1 parent 9c198d1 commit 1c650bd
Showing 1 changed file with 44 additions and 40 deletions.
84 changes: 44 additions & 40 deletions src/main/R/badWeather/dataPrepare.R
Original file line number Diff line number Diff line change
Expand Up @@ -7,55 +7,36 @@ library(dplyr)


#read in ikoki data
ioki2020 <- read_csv2("C:/Users/Simon/Documents/shared-svn/projects/KelRide/data/KEXI/2021-04/IOKI_TABLEAU_Request_List_2020.csv")
ioki2021 <- read_csv2("C:/Users/Simon/Documents/shared-svn/projects/KelRide/data/KEXI/2021-05/IOKI_TABLEAU_Request_List_2021.csv")
ioki2020 <- read_csv2("../../shared-svn/projects/KelRide/data/KEXI/2021-04/IOKI_TABLEAU_Request_List_2020.csv")
ioki2021 <- read_csv2("../../shared-svn/projects/KelRide/data/KEXI/2021-05/IOKI_TABLEAU_Request_List_2021.csv")

ioki2020 <- ioki2020 %>% select(1:20,Passagieranzahl,`Nutzer ID`,`Fahrzeug ID`,`Eindeutige Anfrage`,Ersteller)

ioki2021 <- ioki2021 %>% anti_join(ioki2020, by = "Fahrt ID")
allData_ioki <- rbind(ioki2020,ioki2021)

# read in via data
via0621_0122 <- read_csv2("C:/Users/Simon/Documents/shared-svn/projects/KelRide/data/KEXI/Via_data_2022-02-08/Data_request_TUB_for_Kelheim-Actual_Data-VIA_edited.csv")
via0222_1022 <- read_csv2("C:/Users/Simon/Documents/shared-svn/projects/KelRide/data/KEXI/Via_data_2022-10-10/Data_request_TUB_for_Kelheim-Actual_Data-VIA_Feb_to_Oct_2022_edited_cleaned.csv")
via1022_1222 <- read_csv2("C:/Users/Simon/Documents/shared-svn/projects/KelRide/data/KEXI/Via_data_2023-01-17/Data_request_TUB_for_Kelheim-Actual_Data-Oct-Dec_2022-Data_TUB_for_Kelheim-Actual_Data-Oct_to_Dec_22_edited.csv")
via1222_0323 <- read_csv2("C:/Users/Simon/Documents/shared-svn/projects/KelRide/data/KEXI/Via_data_2023-04-19/Data_request_TUB_for_Kelheim-Actual_Data-Jan-Mar_2023-Kelheim-Actual_Data-Jan-Mar_2023_edited.csv")
via0323_0723 <- read_csv2("C:/Users/Simon/Documents/shared-svn/projects/KelRide/data/KEXI/Via_data_2023-07-10/Data_request_TUB_for_Kelheim-Actual_Data-Apr-Jul_2023-Kelheim-Actual_Data-Apr-Jul_23_edited.csv")
via0621_0624 <- read_csv2("../../shared-svn/projects/KelRide/data/KEXI/VIA_data/raw-data/Fahrtanfragen.csv")

via0621_0122 <- via0621_0122 %>%
select(Request.ID,Request.Status,Actual.Pickup.Time,Reason.For.Travel,Request.Creation.Time) %>%
mutate(Actual.Pickup.Time = ymd_hms(Actual.Pickup.Time))
# request id 5526535 has faulty request time
allData_via <- via0621_0624 %>%
filter(`Fahrtanfragen ID` != 5526535) %>%
mutate(Actual.Pickup.Time = ymd_hms(`Tatsächliche Einstiegszeit`),
Request.Creation.Time = ymd_hms(`Erstellungszeit der Fahrtanfrage`),
Request.ID = `Fahrtanfragen ID`,
Request.Status = `Status der Fahrtanfrage`,
Reason.For.Travel = `Grund für die Fahrt`) %>%
select(Request.ID,Request.Status,Actual.Pickup.Time,Reason.For.Travel,Request.Creation.Time) %>%
# Reason for travel is used to distinguish AV and conventional. the column was added after the av launch in 09-22
mutate(Reason.For.Travel = replace_na(Reason.For.Travel, "DR"))

via0222_1022 <- via0222_1022 %>%
select(Request.ID,Request.Status,Actual.Pickup.Time,Reason.For.Travel,Request.Creation.Time) %>%
mutate(Actual.Pickup.Time = ymd_hms(Actual.Pickup.Time), Request.Creation.Time = ymd_hms(Request.Creation.Time)) %>% anti_join(via0621_0122, by = "Request.ID")

via1022_1222 <- via1022_1222 %>%
select(Request.ID,Request.Status,Actual.Pickup.Time,Reason.For.Travel,Request.Creation.Time) %>%
mutate(Actual.Pickup.Time = ymd_hms(Actual.Pickup.Time), Request.Creation.Time = ymd_hms(Request.Creation.Time)) %>% anti_join(via0222_1022, by = "Request.ID")

via1222_0323 <- via1222_0323 %>%
select(Request.ID,Request.Status,Actual.Pickup.Time,Reason.For.Travel,Request.Creation.Time) %>%
mutate(Actual.Pickup.Time = ymd_hms(Actual.Pickup.Time), Request.Creation.Time = ymd_hms(Request.Creation.Time)) %>% anti_join(via1022_1222, by = "Request.ID")

via0323_0723 <- via0323_0723 %>%
select(Request.ID,Request.Status,Actual.Pickup.Time,Reason.For.Travel,Request.Creation.Time) %>%
mutate(Actual.Pickup.Time = ymd_hms(Actual.Pickup.Time), Request.Creation.Time = ymd_hms(Request.Creation.Time)) %>% anti_join(via1222_0323, by = "Request.ID")

test <- unique(via1022_1222$Request.Status)

# allData_via <- rbind(via0621_0122,via0222_1022,via1022_1222,via1222_0323,via0323_0723)
allData_via <- bind_rows(via0621_0122,via0222_1022)
allData_via <- bind_rows(allData_via,via1022_1222)
allData_via <- bind_rows(allData_via,via1222_0323)
allData_via <- bind_rows(allData_via,via0323_0723)
unique(allData_via$Request.Status)
unique(allData_ioki$Stornierungsgrund)
ids <- unique(allData_via$Request.ID)

naVia <- allData_via %>% filter(is.na(Actual.Pickup.Time))
#naVia2 <- allData_via %>% filter(is.na(Actual.Dropoff.Time))
naIoki2 <- allData_ioki %>% filter(is.na(Abfahrtszeit))

#print(via0621_0122)

# get all requests per day for each dataset and join them
requests_ioki <- allData_ioki %>% mutate(`Fahrtwunsch erstellt` = as.Date(dmy_hms(`Fahrtwunsch erstellt`))) %>% filter(!is.na(`Fahrtwunsch erstellt`)) %>%
mutate(dummy = 1) %>%
group_by(`Fahrtwunsch erstellt`) %>% summarize(noRequests = as.integer(sum(dummy))) %>%
Expand All @@ -71,6 +52,28 @@ requests_via <- allData_via %>%

requests_all <- rbind(requests_ioki,requests_via)

unique(allData_ioki$Stornierungsgrund)

# get all rejections (because of unavailable vehicle) per dataset and join
rejections_ioki <- allData_ioki %>%
filter(Stornierungsgrund == "no_vehicle_available") %>%
mutate(`Fahrtwunsch erstellt` = as.Date(dmy_hms(`Fahrtwunsch erstellt`))) %>% filter(!is.na(`Fahrtwunsch erstellt`)) %>%
mutate(dummy = 1) %>%
group_by(`Fahrtwunsch erstellt`) %>% summarize(noRejections = as.integer(sum(dummy))) %>%
rename(date = `Fahrtwunsch erstellt`)

rejections_via <- allData_via %>%
filter(Request.Status == "Seat Unavailable") %>%
filter(!is.na(`Request.Creation.Time`)) %>%
filter(Reason.For.Travel=="DR") %>%
mutate(`Request.Creation.Time` = as.Date(`Request.Creation.Time`)) %>%
mutate(dummy = 1) %>%
group_by(Request.Creation.Time) %>% summarize(noRejections = as.integer(sum(dummy))) %>%
rename(date = `Request.Creation.Time`)

rejections_all <- rbind(rejections_ioki, rejections_via)

# get all completed rides per dataset and join
allData_ioki <- allData_ioki %>% mutate(`Abfahrtszeit` = as.Date(dmy_hms(`Abfahrtszeit`))) %>% filter(!is.na(`Abfahrtszeit`))
allData_via <- allData_via %>%
filter(!is.na(`Actual.Pickup.Time`)) %>%
Expand All @@ -95,6 +98,7 @@ demandData_all <- rbind(demandData_ioki,demandData_via)

demandDataSince2022 <- demandData_all %>% filter(date >= as.Date(ymd("2022-01-01")))

write.csv2(demandData_all,"C:/Users/Simon/Documents/shared-svn/projects/KelRide/data/badWeather/data/allDemandByDate.csv", quote = FALSE, row.names=FALSE)
write.csv2(demandDataSince2022,"C:/Users/Simon/Documents/shared-svn/projects/KelRide/data/badWeather/data/allDemandByDateSince2022.csv", quote = FALSE, row.names=FALSE)
write.csv2(requests_all,"C:/Users/Simon/Documents/shared-svn/projects/KelRide/data/badWeather/data/allRequestsByDate.csv", quote = FALSE, row.names=FALSE)
write.csv2(demandData_all,"../../shared-svn/projects/KelRide/data/badWeather/data/allDemandByDate.csv", quote = FALSE, row.names=FALSE)
write.csv2(demandDataSince2022,"../../shared-svn/projects/KelRide/data/badWeather/data/allDemandByDateSince2022.csv", quote = FALSE, row.names=FALSE)
write.csv2(requests_all,"../../shared-svn/projects/KelRide/data/badWeather/data/allRequestsByDate.csv", quote = FALSE, row.names=FALSE)
write.csv2(rejections_all,"../../shared-svn/projects/KelRide/data/badWeather/data/rejectionsByDate.csv", quote = FALSE, row.names=FALSE)

0 comments on commit 1c650bd

Please sign in to comment.