generated from SiddharthaShandilya/air_quality_index_prediction
-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathdvc.yaml
94 lines (81 loc) · 2.75 KB
/
dvc.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
# DVC pipeline definition. Every entry under `stages` names one step and lists
# the command to run (`cmd`), the files it depends on (`deps`) and the files
# or directories it produces (`outs`).
stages:
  # Step 1: runs the retrieval script. Outputs: the dementia dataset CSV and
  # this step's run log.
  FETCHING_DATA:
    cmd: >-
      python src/stage_01_retrieve_html.py
      --config config/config.yaml
    deps:
      - src/stage_01_retrieve_html.py
      - src/utils/all_utils.py
      - config/config.yaml
    outs:
      - artifacts/Data_archive/dementia_dataset/dementia_dataset.csv
      - logs/stage_01_running_logs.log

  # Disabled step, kept for reference only.
  # NOTE(review): its cmd runs stage_02_EDA.py while its deps list
  # stage_02_Extract_combine.py; reconcile the two before re-enabling.
  # Extracting and combining data:
  #   cmd: python src/stage_02_EDA.py --config config/config.yaml
  #   deps:
  #     - src/stage_02_Extract_combine.py
  #     - src/stage_01_retrieve_html.py
  #     - src/utils/all_utils.py
  #     - config/config.yaml
  #     # - artifacts/data/AQI/aqi2013.csv
  #     - artifacts/Data_archive/AQI/
  #     - artifacts/Data_archive/Html_Data
  #     - requirements.txt
  #   outs:
  #     - artifacts/Data_archive/Real-Data/Real_Combine.csv

  # Step 2: consumes the CSV produced by FETCHING_DATA. Outputs: a graphs
  # directory, the cleaned combined CSV and this step's run log.
  Exploratory_Data_Analysis:
    cmd: >-
      python src/stage_02_EDA.py
      --config config/config.yaml
    deps:
      - src/stage_02_EDA.py
      - artifacts/Data_archive/dementia_dataset/dementia_dataset.csv
      - src/utils/all_utils.py
      - config/config.yaml
      - requirements.txt
    outs:
      - artifacts/reports_dir/graphs_dir/
      - artifacts/Data_archive/Real-Data/Cleaned_Real_Combined_data.csv
      - logs/stage_02_running_logs.log

  # Step 3: consumes the cleaned CSV from Exploratory_Data_Analysis and is
  # additionally driven by params.yaml. Outputs: the split-data directory and
  # this step's run log.
  Splitting_Data:
    cmd: >-
      python src/stage_03_splitting_data.py
      --config config/config.yaml
      --params params.yaml
    deps:
      - src/stage_03_splitting_data.py
      - artifacts/Data_archive/Real-Data/Cleaned_Real_Combined_data.csv
      - src/utils/all_utils.py
      - config/config.yaml
      - requirements.txt
      - params.yaml
    outs:
      - artifacts/split_data_dir/
      - logs/stage_03_running_logs.log

  # Step 4: consumes the train_data_dir sub-directory of the split-data
  # output. Outputs: the trained-model directory, scores.json and this step's
  # run log.
  TRAINING_AND_GENERATING_MODEL:
    cmd: >-
      python src/stage_04_xgboost_regression.py
      --config config/config.yaml
      --params params.yaml
    deps:
      - src/stage_04_xgboost_regression.py
      - artifacts/split_data_dir/train_data_dir
      - src/utils/all_utils.py
      - config/config.yaml
      - requirements.txt
      - params.yaml
    outs:
      - artifacts/trained_model/
      - artifacts/reports_dir/scores.json
      - logs/stage_04_running_logs.log

  # Step 5: consumes the test_data_dir sub-directory of the split-data output
  # together with the trained-model directory. Outputs: a graph directory for
  # the trained model and this step's run log.
  TESTING_AND_GENERATING_GRAPH:
    cmd: >-
      python src/stage_05_model_accuracy_testing.py
      --config config/config.yaml
    deps:
      - src/stage_05_model_accuracy_testing.py
      - artifacts/split_data_dir/test_data_dir
      - artifacts/trained_model/
      - src/utils/all_utils.py
      - config/config.yaml
      - requirements.txt
    outs:
      - artifacts/reports_dir/trained_model_graph_dir
      - logs/stage_05_running_logs.log

  # Disabled step: it cannot be used in a GitHub Actions run.
  # LAUNCHING_WEB_APPLICATION:
  #   cmd: python app.py
  #   deps:
  #     - app.py
  #     - templates/
  #     - artifacts/trained_model/
  #     - static/
  #     - config/config.yaml