-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathMakefile
executable file
·216 lines (181 loc) · 7.05 KB
/
Makefile
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
IMAGE = disaster
PACKAGE = disaster
CLOUD_ROOT = s3://data-analytics-nw/models
PWD := $(shell pwd)
UID := $(shell id -u)
GID := $(shell id -g)
USER := $(UID):$(GID)
DOCKER_VOLUME := $(PWD)/workspace
DOCKER_APP := /app
DOCKER_FOLDER := $(DOCKER_APP)/workspace
DOCKER_RUN = docker run -t --rm \
--user $(USER) \
-v $(DOCKER_VOLUME):$(DOCKER_FOLDER) \
-e APP_VERSION=$(VERSION)
STATUS_PREFIX = "\033[1;32m[+]\033[0m "
ATTENTION_PREFIX = "\033[1;36m[!]\033[0m "
help:
@echo "usage: make <command> [VERSION=X.Y.Z]"
@echo
@echo "COMMANDS"
@echo " check Run unit-tests and linters"
@echo " shell Enter into a shell (sh) of the docker container."
@echo " jupyter Launch jupyterlab with the software installed as library."
@echo " jupyter-notebook Launch jupyterlab with the software installed as library."
@echo " build Build docker image from Dockerfile."
@echo " release [Need VERSION] Release a new version of software as tag."
@echo " dist [Need VERSION] Generate Python packages to workspace/dist."
@echo " clean Clean workspace/dist software distribution"
@echo " split Generate train/valid/test sets"
@echo " process Pre-process text for NLP tasks"
@echo " features Generates train data for the model and store it to workspace/data/ ."
@echo " select Feature Selection based on training data only"
@echo " train Train models with the generated data and store the binaries at workspace/model/."
@echo " metadata Create metadata for the trained model at workspace/."
@echo " predict [Need INPUT] Use trained model to predict data specified on the INPUT variable."
@echo " run Run the full pipeline."
@echo " skip Run pipeline by skipping split/process/features/select."
@echo " docs Generate html documentation based on doc files (md) and source code."
@echo
@echo "VARS"
@echo " VERSION Software Version variable."
@echo " INPUT Path for data to be predicted."
@echo " PARAMS Parameters to pass as: $ disaster <command> $(PARAMS)."
# Variable set checking
guard-%:
@ if [ "${${*}}" = "" ]; then echo "Variable '$*' not set"; exit 1; fi
#################
# User Commands #
#################
split: build
$(DOCKER_RUN) $(IMAGE) split $(PARAMS)
process: build
$(DOCKER_RUN) $(IMAGE) process $(PARAMS)
features: build
$(DOCKER_RUN) $(IMAGE) features $(PARAMS)
select: build
$(DOCKER_RUN) $(IMAGE) select $(PARAMS)
train: build
$(DOCKER_RUN) $(IMAGE) train $(PARAMS)
metadata: build
$(DOCKER_RUN) $(IMAGE) metadata $(PARAMS)
predict: guard-INPUT mkdir-predict
$(DOCKER_RUN) -v $(PWD)/predict:$(DOCKER_APP)/predict \
$(IMAGE) predict --input-data $(INPUT) $(PARAMS)
run: build
$(DOCKER_RUN) $(IMAGE) run $(PARAMS)
skip: build
$(DOCKER_RUN) $(IMAGE) skip $(PARAMS)
jupyter:
@printf $(STATUS_PREFIX); echo "PREPARING JUPYTERLAB ENVIRONMENT"
@docker kill jupyter 2> /dev/null || echo No jupyter running now
docker run -d --rm -p 8888:8888 \
-e JUPYTER_ENABLE_LAB=yes \
--name="jupyter" \
--user root \
-e NB_UID=$(UID) -e NB_GID=$(GID) \
-v $(PWD):/home/jovyan/work \
jupyter/datascience-notebook \
start.sh jupyter lab --LabApp.token=''
docker exec -t jupyter \
pip --disable-pip-version-check \
--no-cache-dir \
install -e /home/jovyan/work/.
docker exec -t -d jupyter chown -R $(USER) /home/jovyan/work/.
@printf $(ATTENTION_PREFIX); echo "JupyterLab: http://127.0.0.1:8888"
jupyter-notebook:
@printf $(STATUS_PREFIX); echo "PREPARING JUPYTER NOTEBOOK ENVIRONMENT"
@docker kill jupyter 2> /dev/null || echo No jupyter running now
docker run -d --rm -p 8888:8888 \
--name="jupyter" \
--user root \
-e NB_UID=$(UID) -e NB_GID=$(GID) \
-v $(PWD):/home/jovyan/work \
jupyter/datascience-notebook \
start.sh jupyter notebook --NotebookApp.token=''
docker exec -t jupyter \
pip --disable-pip-version-check \
--no-cache-dir \
install -e /home/jovyan/work/.
docker exec -t -d jupyter chown -R $(USER) /home/jovyan/work/.
@printf $(ATTENTION_PREFIX); echo "JupyterNotebook: http://127.0.0.1:8888"
# Enter in shell of the Docker container for debugging purposes
shell: build
@printf $(STATUS_PREFIX); echo "OPEN SHELL"
$(DOCKER_RUN) -it --entrypoint="sh" $(IMAGE)
# Tag software and push to repository
release: guard-VERSION check
@printf $(STATUS_PREFIX); echo "CREATE NEW GIT TAG" $(VERSION)
git tag -a $(VERSION) -m "Auto-generated release $(VERSION)"
git push origin master tag $(VERSION)
# Distribute software in multiple formats
dist: guard-VERSION build clean
@printf $(STATUS_PREFIX); echo "DISTRIBUTE SOFTWARE PACKAGES IN" $(DOCKER_VOLUME)/dist/
$(DOCKER_RUN) --entrypoint="python3" $(IMAGE) \
setup.py bdist_egg \
--dist-dir $(DOCKER_FOLDER)/dist/
$(DOCKER_RUN) --entrypoint="python3" $(IMAGE) \
setup.py bdist_wheel \
--dist-dir $(DOCKER_FOLDER)/dist/
$(DOCKER_RUN) --entrypoint="python3" $(IMAGE) \
setup.py bdist --formats=gztar \
--dist-dir $(DOCKER_FOLDER)/dist/
# Build docker image, run lint & unit-tests
check: build lint tests
tests:
@printf $(STATUS_PREFIX); echo "RUN UNIT-TESTS"
$(DOCKER_RUN) --entrypoint="pytest" $(IMAGE) \
--cov=$(PACKAGE)/
lint: flake8 mypy bandit
mypy:
@printf $(STATUS_PREFIX); echo "LINT MYPY: TYPE CHECKING"
$(DOCKER_RUN) --entrypoint="mypy" $(IMAGE) \
--ignore-missing-imports \
--strict-optional \
$(PACKAGE)/
flake8:
@printf $(STATUS_PREFIX); echo "LINT FLAKE8: STYLE CHECKING"
$(DOCKER_RUN) --entrypoint="flake8" $(IMAGE) \
$(PACKAGE)/
bandit:
@printf $(STATUS_PREFIX); echo "LINT BANDIT: SECURITY CHECKING"
$(DOCKER_RUN) --entrypoint="bandit" $(IMAGE) \
$(PACKAGE)/ -r
clean-dist:
@printf $(STATUS_PREFIX); echo "CLEAN DIST FOLDER"
$(DOCKER_RUN) --entrypoint="sh" $(IMAGE) \
-c 'rm -f $(DOCKER_FOLDER)/dist/*'
rm -rf $(DOCKER_VOLUME)/dist/
clean: clean-dist
rm -rf disaster.egg_info
find . -iname __pycache__ | xargs rm -rf
###################################
# CI, Docker and Release commands #
###################################
# Build docker image
build: mkdir-workspace
@printf $(STATUS_PREFIX); echo "BUILD DOCKER IMAGE"
docker build -t $(IMAGE) .
# Build docker requirements image
build-docs:
@printf $(STATUS_PREFIX); echo "BUILD DOCKER REQUIREMENTS IMAGE"
docker build -t "$(IMAGE).docs" -f docs/hack/Dockerfile .
mkdir-%:
mkdir -p $(PWD)/$*
chmod a+w $(PWD)/$*
clean-workspace:
@printf $(STATUS_PREFIX); echo "CLEAN FILESYSTEM"
$(DOCKER_RUN) --entrypoint="sh" $(IMAGE) \
-c 'rm -rf $(DOCKER_FOLDER)/*'
clean-ci: clean-workspace
rm -rf $(DOCKER_VOLUME)
docs: build-docs
@printf $(STATUS_PREFIX); echo "GENERATE AUTO DOCUMENTATON"
docker run \
--user $(shell id -u):$(shell id -g) \
--rm \
-v $(PWD):/workspace \
-w /workspace \
"$(IMAGE).docs" \
bash docs/hack/docs.sh
.PHONY: clean flake8 mypy flake8 tests lint help docs