-
Notifications
You must be signed in to change notification settings - Fork 1
/
explore.py
35 lines (24 loc) · 1.41 KB
/
explore.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
import analysis
from georgiatech import GeorgiaTech
import pandas as pd
# Exploratory script: load the small dataset, draw the main plots from one
# sample, then draw the ancillary validation/distance plots from a second one.
gt_context = GeorgiaTech()
df = pd.read_csv("dataset_small.csv")
print()

# Plot data
# NOTE(review): the meaning of 1000 and of the column list is defined by
# analysis.sample (presumably a sample size and grouping keys) -- confirm there.
df_sample = analysis.sample(df, 1000, ["route", "stop", "session", "approach"])

# One entry per analysis.plot call, in the order the plots are produced.
# Each tuple holds the third, fourth and fifth positional arguments of
# analysis.plot: a column name, a pair of column names, and an integer.
# NOTE(review): the integer (1, 2 or 3) is passed through unchanged; what it
# selects is decided inside analysis.plot and is not visible from this script.
plot_specs = [
    ("route", ("actualSecondsToArrival", "abserror"), 1),
    ("route", ("distance", "abserror"), 1),
    ("route", ("kmperhr", "abserror"), 1),
    ("route", ("minutesIntoDay", "abserror"), 1),
    ("route", ("layover", "actualSecondsToArrival"), 3),
    ("route", ("wind", "actualSecondsToArrival"), 3),
    ("route", ("pressure", "actualSecondsToArrival"), 3),
    ("route", ("humidity", "actualSecondsToArrival"), 3),
    ("route", ("visibility", "actualSecondsToArrival"), 3),
    ("route", ("secondsToArrival", "actualSecondsToArrival"), 2),
    ("cluster", ("secondsToArrival", "actualSecondsToArrival"), 2),
]
for field, pair, option in plot_specs:
    analysis.plot(df_sample, gt_context, field, pair, option)

# Ancillary plots, showing heuristic validation and distance validation
df_sample = analysis.sample(df, 10, ["route", "stop", "session"])
analysis.plot_validation(df_sample)

# plot_distance is called ten times with the same sample.
# NOTE(review): presumably each call renders a different item -- confirm
# against analysis.plot_distance.
for _ in range(10):
    analysis.plot_distance(df_sample)