File size: 3,396 Bytes
e8059bf |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 |
.PHONY: clean dirs virtualenv lint requirements push pull reproduce
#################################################################################
# GLOBALS #
#################################################################################
PROJECT_DIR := $(shell dirname $(realpath $(lastword $(MAKEFILE_LIST))))
PYTHON_INTERPRETER = python3
#################################################################################
# COMMANDS #
#################################################################################
## Create virtualenv.
## Activate with the command:
## source env/bin/activate
virtualenv:
$(PYTHON_INTERPRETER) -m venv env
$(info "Activate with the command 'source env/bin/activate'")
## Install Python Dependencies.
## Make sure you activate the virtualenv first!
requirements:
$(PYTHON_INTERPRETER) -m pip install -U pip setuptools wheel
$(PYTHON_INTERPRETER) -m pip install -r requirements.txt
## Create directories that are ignored by git but required for the project
dirs:
mkdir -p data/raw data/processed models
## Delete all compiled Python files
clean:
find . -type f -name "*.py[co]" -delete
find . -type d -name "__pycache__" -delete
## To use the pre-commit hooks
pre-commit-install:
pre-commit install
setup-data-validation:
cd src/data; great_expectations -y init; great_expectations datasource new
run-data-validation:
cd src/data; python data_validation.py
## Lint using flake8
lint:
flake8 src
## Upload Data to default DVC remote
push:
dvc push -r origin
## Download Data from default DVC remote
pull:
dvc pull -r origin
## Reproduce the DVC pipeline - recompute any modified outputs such as processed data or trained models
reproduce:
dvc repro
#################################################################################
# PROJECT RULES #
#################################################################################
#################################################################################
# Self Documenting Commands #
#################################################################################
.DEFAULT_GOAL := reproduce
# Inspired by <http://marmelab.com/blog/2016/02/29/auto-documented-makefile.html>
# sed script explained:
# /^##/:
# * save line in hold space
# * purge line
# * Loop:
# * append newline + line to hold space
# * go to next line
# * if line starts with doc comment, strip comment character off and loop
# * remove target prerequisites
# * append hold space (+ newline) to line
# * replace newline plus comments by `---`
# * print line
# Separate expressions are necessary because labels cannot be delimited by
# semicolon; see <http://stackoverflow.com/a/11799865/1968>
.PHONY: help
help:
@echo "$$(tput bold)Available rules:$$(tput sgr0)"
@echo
@sed -n -e "/^## / Missing" $Missing \
| LC_ALL='C' sort --ignore-case \
| awk -F '---' \
-v ncol=$$(tput cols) \
-v indent=19 \
-v col_on="$$(tput setaf 6)" \
-v col_off="$$(tput sgr0)" \
'Missing \
printf "%s ", words[i]; \
} \
printf "\n"; \
}' \
| more $(shell test $(shell uname) = Darwin && echo '--no-init --raw-control-chars')
|