tappyness1 committed on
Commit
33f164a
·
1 Parent(s): 471f224

modularising data ingestion

Browse files
Files changed (2) hide show
  1. app.py +1 -17
  2. src/data_ingestion.py +19 -0
app.py CHANGED
@@ -5,23 +5,7 @@ from datasets import load_dataset
5
  import os
6
  from src.basic_plot import basic_chart
7
  from src.map_viz import calling_map_viz
8
-
9
- def daily_average(counts_df):
10
-
11
- filtered_views_list = ['View_from_Second_Link_at_Tuas_to_sg',
12
- 'View_from_Second_Link_at_Tuas_to_jh',
13
- 'View_from_Tuas_Checkpoint_to_sg',
14
- 'View_from_Tuas_Checkpoint_to_jh',
15
- 'View_from_Woodlands_Causeway_Towards_Johor_to_sg',
16
- 'View_from_Woodlands_Causeway_Towards_Johor_to_jh',
17
- 'View_from_Woodlands_Checkpoint_Towards_BKE_to_sg',
18
- 'View_from_Woodlands_Checkpoint_Towards_BKE_to_jh']
19
-
20
- counts_df_filter_views = counts_df[counts_df['view'].isin(filtered_views_list)]
21
- counts_df_filter_views['date'] = pd.to_datetime(counts_df_filter_views['date'])
22
- counts_df_filter_views['day_of_week'] = counts_df_filter_views['date'].dt.day_of_week
23
- date_view_group = counts_df_filter_views.groupby(by=['view', 'day_of_week']).mean()
24
- date_view_group = date_view_group.reset_index()
25
 
26
 
27
  def main():
 
5
  import os
6
  from src.basic_plot import basic_chart
7
  from src.map_viz import calling_map_viz
8
+ from src.data_ingestion import daily_average
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
9
 
10
 
11
  def main():
src/data_ingestion.py ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import pandas as pd
2
+ import numpy as np
3
+
4
def daily_average(counts_df):
    """Average the numeric columns per camera view and day of week.

    Only rows whose ``view`` is one of the eight hard-coded checkpoint views
    are kept. The ``date`` column is parsed with ``pd.to_datetime`` and a
    ``day_of_week`` column is derived from it (Monday is 0, Sunday is 6, per
    pandas' ``dt.day_of_week``).

    Args:
        counts_df: DataFrame with at least a ``view`` column and a ``date``
            column that ``pd.to_datetime`` can parse. Any further numeric
            columns are averaged. NOTE(review): the exact schema of the
            upstream dataset is not visible here -- confirm against caller.

    Returns:
        A DataFrame with one row per ``(view, day_of_week)`` pair, holding
        ``view``, ``day_of_week`` and the mean of every numeric column.
        The input frame is not modified.

    Raises:
        KeyError: if ``counts_df`` has no ``view`` or ``date`` column.
    """
    filtered_views_list = [
        'View_from_Second_Link_at_Tuas_to_sg',
        'View_from_Second_Link_at_Tuas_to_jh',
        'View_from_Tuas_Checkpoint_to_sg',
        'View_from_Tuas_Checkpoint_to_jh',
        'View_from_Woodlands_Causeway_Towards_Johor_to_sg',
        'View_from_Woodlands_Causeway_Towards_Johor_to_jh',
        'View_from_Woodlands_Checkpoint_Towards_BKE_to_sg',
        'View_from_Woodlands_Checkpoint_Towards_BKE_to_jh',
    ]

    # Explicit copy: assigning new columns onto a boolean-filtered slice
    # triggers SettingWithCopyWarning and relies on pandas' copy heuristics.
    counts_df_filter_views = counts_df[
        counts_df['view'].isin(filtered_views_list)
    ].copy()
    counts_df_filter_views['date'] = pd.to_datetime(
        counts_df_filter_views['date']
    )
    counts_df_filter_views['day_of_week'] = (
        counts_df_filter_views['date'].dt.day_of_week
    )

    # numeric_only=True keeps the aggregation from raising on non-numeric
    # columns (pandas >= 2.0 no longer drops them silently) and skips the
    # meaningless "mean date" per group.
    date_view_group = (
        counts_df_filter_views
        .groupby(by=['view', 'day_of_week'])
        .mean(numeric_only=True)
        .reset_index()
    )

    # The result used to be computed and then discarded; hand it back.
    return date_view_group