-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathMakefile
141 lines (120 loc) · 3.96 KB
/
Makefile
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
# Every rule in this file is a command, not a file to build, so each one is
# declared phony; otherwise a file or directory that happens to share a
# target's name would make that target look up to date and skip its recipe.
# NOTE(review): `requirements`, `sync_data_to_s3` and `sync_data_from_s3` have
# no rule visible in this file. `requirements` is kept on purpose because
# `data` still names it as a prerequisite.
.PHONY: clean data lint requirements sync_data_to_s3 sync_data_from_s3 features \
        features_random_meta features_random train_models lbm_model \
        catboost_model fit_models model_chain stacking shap_plots
#################################################################################
# GLOBALS #
#################################################################################
# Directory that contains this Makefile, resolved once while the file is parsed.
PROJECT_DIR := $(shell dirname $(realpath $(lastword $(MAKEFILE_LIST))))
# Placeholder bucket name; no rule visible in this file reads it.
BUCKET := [OPTIONAL] your-bucket-for-syncing-data (do not include 's3://')
# Profile name; not referenced by any rule visible in this file.
PROFILE := default
PROJECT_NAME := data_science_for_business_lmu
# Command used to launch every Python script in the rules below.
# Override per invocation with e.g. `make features PYTHON_INTERPRETER=python3`.
PYTHON_INTERPRETER := python
#################################################################################
# COMMANDS #
#################################################################################
# Runs src/data/make_dataset.py with the configured interpreter.
# NOTE(review): the `requirements` prerequisite is declared phony but has no
# rule visible in this file, so it appears to run nothing - confirm whether a
# dependency-install step was meant to exist.
## Make Dataset
data: requirements
	$(PYTHON_INTERPRETER) src/data/make_dataset.py
# Single depth-first pass over the tree: -delete implies -depth, so bytecode
# files inside a __pycache__ directory are removed before find attempts to
# remove the directory itself (which only succeeds once it is empty).
## Delete all compiled Python files
clean:
	find . \( -type f -name "*.py[co]" -o -type d -name "__pycache__" \) -delete
# Invokes the flake8 executable found on PATH against the src directory.
## Lint using flake8
lint:
	flake8 src
# The "## " line below is what the help rule prints for this target; it must
# stay directly above the rule header.
# NOTE(review): the literal False is passed as the script's only argument;
# features_random passes True to the same script - confirm the flag's meaning
# in build_features.py.
## Run src/features/build_features.py with the argument False
features:
	$(PYTHON_INTERPRETER) src/features/build_features.py False
# Usage: make features_random_meta [max=N]
# The value of `max` is forwarded as the script's single argument; when it is
# unset or expands to blank, 10 is passed instead. One recipe line replaces
# the previous duplicated ifdef/else branches.
## Run src/features/random_features.py with max as its argument (default 10)
features_random_meta:
	$(PYTHON_INTERPRETER) src/features/random_features.py $(or $(strip $(max)),10)
# The "## " line below is what the help rule prints for this target; it must
# stay directly above the rule header.
# NOTE(review): same script as the `features` target but with True instead of
# False - presumably switches to random feature sets; confirm in
# build_features.py.
## Run src/features/build_features.py with the argument True
features_random:
	$(PYTHON_INTERPRETER) src/features/build_features.py True
# Usage: make train_models [feature_set=N]
# Passes feature_set (1 when unset or blank) as the first argument and an
# explicit empty string as the second argument of build_model.py. One recipe
# line replaces the previous duplicated ifdef/else branches.
## Run src/models/build_model.py for feature_set (default 1) with an empty model name
train_models:
	$(PYTHON_INTERPRETER) src/models/build_model.py $(or $(strip $(feature_set)),1) ""
# Usage: make lbm_model [feature_set=N]
# Passes feature_set (1 when unset or blank) followed by the literal `lbm` to
# build_model.py. One recipe line replaces the previous duplicated
# ifdef/else branches.
## Run src/models/build_model.py for feature_set (default 1) with model lbm
lbm_model:
	$(PYTHON_INTERPRETER) src/models/build_model.py $(or $(strip $(feature_set)),1) lbm
# Usage: make catboost_model [feature_set=N]
# Passes feature_set (1 when unset or blank) followed by the literal
# `catboost` to build_model.py. One recipe line replaces the previous
# duplicated ifdef/else branches.
## Run src/models/build_model.py for feature_set (default 1) with model catboost
catboost_model:
	$(PYTHON_INTERPRETER) src/models/build_model.py $(or $(strip $(feature_set)),1) catboost
# The "## " line below is what the help rule prints for this target; it must
# stay directly above the rule header. The script is run without arguments.
## Run src/models/base_model.py
fit_models:
	$(PYTHON_INTERPRETER) src/models/base_model.py
# The "## " line below is what the help rule prints for this target; it must
# stay directly above the rule header.
# NOTE(review): the `shap_plots` target runs the same script with True as the
# second argument, so the flag presumably toggles SHAP plotting - confirm in
# model_chain.py.
## Run src/models/model_chain.py on feature_set_meta.json with the flag False
model_chain:
	$(PYTHON_INTERPRETER) src/models/model_chain.py feature_set_meta.json False
# Usage: make stacking [feature_set=N]
# Passes feature_set (1 when unset or blank) as the single argument of
# stack_models.py. One recipe line replaces the previous duplicated
# ifdef/else branches.
## Run src/models/stacking/stack_models.py for feature_set (default 1)
stacking:
	$(PYTHON_INTERPRETER) src/models/stacking/stack_models.py $(or $(strip $(feature_set)),1)
# The "## " line below is what the help rule prints for this target; it must
# stay directly above the rule header.
# NOTE(review): identical to the `model_chain` recipe except that the second
# argument is True - presumably this enables SHAP plot output; confirm in
# model_chain.py.
## Run src/models/model_chain.py on feature_set_meta.json with the flag True
shap_plots:
	$(PYTHON_INTERPRETER) src/models/model_chain.py feature_set_meta.json True
#################################################################################
# Self Documenting Commands #
#################################################################################
.DEFAULT_GOAL := help
# Inspired by <http://marmelab.com/blog/2016/02/29/auto-documented-makefile.html>
# sed script explained:
# /^##/:
# * save line in hold space
# * purge line
# * Loop:
# * append newline + line to hold space
# * go to next line
# * if line starts with doc comment, strip comment character off and loop
# * remove target prerequisites
# * append hold space (+ newline) to line
# * replace newline plus comments by `---`
# * print line
# Separate expressions are necessary because labels cannot be delimited by
# semicolon; see <http://stackoverflow.com/a/11799865/1968>
.PHONY: help
# Print the documented rules of this Makefile as a two-column listing.
#   1. echo prints a bold "Available rules:" header followed by a blank line.
#   2. sed finds each "## " doc comment, takes the rule name from the line that
#      follows the comment (text before the first colon) and emits
#      "name---description" on one line.
#   3. sort orders the entries case-insensitively under the C locale.
#   4. awk splits on "---", prints the name in a left-aligned 19-column field
#      coloured with `tput setaf 6`, then word-wraps the description to the
#      width reported by `tput cols`, indenting continuation lines.
#   5. The result is paged through `more`; when `uname` reports Darwin the
#      flags --no-init --raw-control-chars are added.
# Only rules whose header is immediately preceded by a "## " comment appear.
help:
	@echo "$$(tput bold)Available rules:$$(tput sgr0)"
	@echo
	@sed -n -e "/^## / { \
		h; \
		s/.*//; \
		:doc" \
		-e "H; \
		n; \
		s/^## //; \
		t doc" \
		-e "s/:.*//; \
		G; \
		s/\\n## /---/; \
		s/\\n/ /g; \
		p; \
	}" ${MAKEFILE_LIST} \
	| LC_ALL='C' sort --ignore-case \
	| awk -F '---' \
		-v ncol=$$(tput cols) \
		-v indent=19 \
		-v col_on="$$(tput setaf 6)" \
		-v col_off="$$(tput sgr0)" \
	'{ \
		printf "%s%*s%s ", col_on, -indent, $$1, col_off; \
		n = split($$2, words, " "); \
		line_length = ncol - indent; \
		for (i = 1; i <= n; i++) { \
			line_length -= length(words[i]) + 1; \
			if (line_length <= 0) { \
				line_length = ncol - indent - length(words[i]) - 1; \
				printf "\n%*s ", -indent, " "; \
			} \
			printf "%s ", words[i]; \
		} \
		printf "\n"; \
	}' \
	| more $(shell test $(shell uname) = Darwin && echo '--no-init --raw-control-chars')