-
Notifications
You must be signed in to change notification settings - Fork 0
/
Snakefile
71 lines (64 loc) · 1.71 KB
/
Snakefile
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
rule all:
    """Aggregate target: lists the final artefacts of the workflow.

    The rule has no command of its own; requesting it makes Snakemake
    schedule whichever rules declare these three files as outputs.
    As the first rule in the file it is the target used when none is
    given on the command line.
    """
    # NOTE(review): the backslash separators look Windows-specific --
    # confirm before running this workflow on another platform.
    input:
        eda_script=r'notebooks\01_exploratory_data_analysis_dummy.py',
        compare_script=r'notebooks\02_compare_models_dummy.py',
        submission=r'results\submission.csv',
rule download:
    """Run the `titanic download` command.

    Declares the three raw CSV files as outputs and takes no inputs, so
    the rule is only triggered when one of those files is missing.
    """
    # NOTE(review): paths use backslash separators, which look
    # Windows-specific -- confirm before running elsewhere.
    output:
        gender_submission=r'data\raw\gender_submission.csv',
        test=r'data\raw\test.csv',
        train=r'data\raw\train.csv',
    shell:
        r'titanic download'
rule eda:
    """Run the `titanic eda` command.

    Depends on the raw train/test CSVs, the data dictionary spreadsheet
    and the exploratory notebook; declares a single .py file next to the
    notebook as its output.
    """
    input:
        train=r'data\raw\train.csv',
        test=r'data\raw\test.csv',
        data_dict=r'references\data_dict.xlsx',
        notebook=r'notebooks\01_exploratory_data_analysis_dummy.ipynb',
    output:
        script=r'notebooks\01_exploratory_data_analysis_dummy.py',
    shell:
        r'titanic eda'
rule features:
    """Run the `titanic features` command.

    Takes the raw test and train CSVs as inputs and declares three
    pickle files in the processed-data directory as outputs.
    """
    input:
        test=r'data\raw\test.csv',
        train=r'data\raw\train.csv',
    output:
        X_train=r'data\processed\X_train.pickle',
        X_test=r'data\processed\X_test.pickle',
        y_train=r'data\processed\y_train.pickle',
    shell:
        r'titanic features'
rule crossval:
    """Run the `titanic crossval` command.

    Depends on the processed X_train / y_train pickles and declares four
    model pickles (logreg, forest, svc, voting) as outputs.
    """
    input:
        X_train=r'data\processed\X_train.pickle',
        y_train=r'data\processed\y_train.pickle',
    output:
        logreg=r'models\logreg.pickle',
        forest=r'models\forest.pickle',
        svc=r'models\svc.pickle',
        voting=r'models\voting.pickle',
    shell:
        r'titanic crossval'
rule compmod:
    """Run the `titanic compmod` command.

    Depends on the four model pickles and the model-comparison notebook;
    declares a single .py file next to that notebook as its output.
    """
    input:
        logreg=r'models\logreg.pickle',
        forest=r'models\forest.pickle',
        svc=r'models\svc.pickle',
        voting=r'models\voting.pickle',
        notebook=r'notebooks\02_compare_models_dummy.ipynb',
    output:
        script=r'notebooks\02_compare_models_dummy.py',
    shell:
        r'titanic compmod'
rule submission:
    """Run the `titanic submission` command.

    Declares the forest model pickle as its only input and the
    submission CSV in the results directory as its output.
    """
    # NOTE(review): only the forest model is listed as an input. If the
    # command also reads other files (e.g. processed test features),
    # that dependency is not declared here -- TODO confirm.
    input:
        forest=r'models\forest.pickle',
    output:
        submission=r'results\submission.csv',
    shell:
        r'titanic submission'
rule clean:
    """Run the `titanic clean -a` command.

    The rule declares neither inputs nor outputs, so nothing depends on
    it; it only runs when requested explicitly as a target.
    """
    shell:
        r'titanic clean -a'