forked from PSLmodels/taxdata
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathMakefile
163 lines (143 loc) · 6.3 KB
/
Makefile
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
# GNU Makefile that documents and automates common development operations
# using the GNU make tool (version >= 3.81)
# Development is typically conducted on Linux or Max OS X (with the Xcode
# command-line tools installed), so this Makefile is designed
# to work in that environment (and not on Windows).
# Note that the re-zipping of each .csv.gz file "removes" the time-stamp
# from the GZIP file header, which is necessary for git to
# report the correct status of each .csv.gz file's contents.
# USAGE: taxdata$ make [TARGET]
# Files generated by the puf-files and cps-files rules; intended for removal
# by "make clean CSV=x" once that option is implemented.
# The stage-3 entry is puf_ratios.csv (no .gz), matching the rule target and
# the help text.
# NOTE(review): data/cps.csv.gz is listed here, while the cps rule's target
# is data/cps_raw.csv.gz -- confirm which file name(s) createcps.py writes.
MADE_FILES := data/cps-matched-puf.csv \
              puf_stage1/growfactors.csv \
              puf_stage1/Stage_I_factors.csv \
              puf_stage2/puf_weights.csv.gz \
              puf_stage3/puf_ratios.csv \
              data/cps.csv.gz \
              cps_stage1/stage_2_targets.csv \
              cps_stage2/cps_weights.csv.gz
# help: print the list of supported targets.  It is the first rule in the
# file, so a bare "make" runs it.
# ".PHONY: help" (colon, not "=") is what registers the target as phony;
# ".PHONY=help" would only assign a variable that happens to be named .PHONY.
.PHONY: help
help:
	@echo "USAGE: make [TARGET]"
	@echo "TARGETS:"
	@echo "help : show help message"
	@echo "clean : remove all .pyc files"
	@echo "clean CSV=x : remove all .pyc files and all made files listed in"
	@echo " puf-files and cps-files targets"
	@echo "pytest : generate report for and cleanup after pytest"
	@echo "cstest : generate coding-style errors with pycodestyle"
	@echo "git-sync : synchronize local, origin, and upstream Git repos"
	@echo "git-pr N=n : create local pr-n branch containing upstream PR"
	@echo "puf-files : make each of the following files:"
	@echo " cps-matched-puf.csv"
	@echo " puf.csv"
	@echo " growfactors.csv"
	@echo " puf_weights.csv.gz"
	@echo " puf_ratios.csv"
	@echo "cps-files : make each of the following files:"
	@echo " cps.csv.gz"
	@echo " cps_weights.csv.gz"
	@echo " cps_benefits.csv.gz"
	@echo "all : make both puf-files and cps-files"
# clean: delete every file below the current directory whose name ends in
# "pyc".  With CSV=x a notice is printed because removal of the made files
# is not implemented yet; without it a different notice is printed.
# The -name pattern is quoted so the shell cannot expand it against files in
# the current directory before find sees it.
.PHONY: clean
clean:
	@find . -name '*pyc' -exec rm -f {} +
ifeq ($(CSV),x)
	@echo "The CSV=x option logic is not yet implemented"
# @rm -f $(MADE_FILES)
else
	@echo "No CSV=x option used so skipping removal of all made files"
endif
# Shell command run after the test suite: removes every entry directly inside
# the current directory whose name ends in "cache".
# -maxdepth comes before the -name test (GNU find warns otherwise), and the
# pattern is quoted so the shell passes it to find unexpanded.
define pytest-cleanup
find . -maxdepth 1 -name '*cache' -exec rm -r {} +
endef
# pytest: run the test suite with the -n4 option, then run the
# pytest-cleanup command.  The cleanup line only runs when pytest succeeds,
# because make stops a recipe at the first failing line.
# Declared phony with ".PHONY:" so the recipe runs even if a file or
# directory named "pytest" exists.
.PHONY: pytest
pytest:
	@pytest -n4
	@$(pytest-cleanup)
# cstest: report coding-style errors by running pycodestyle on the current
# directory.  Declared phony with ".PHONY:" (a "=" would only set a variable).
.PHONY: cstest
cstest:
	pycodestyle .
# git-sync: run the ./gitsync script found in the current directory.
# Declared phony with ".PHONY:" (a "=" would only set a variable).
.PHONY: git-sync
git-sync:
	@./gitsync
# git-pr: run the ./gitpr script, passing the value of N given on the make
# command line (e.g. "make git-pr N=123") as its only argument.
# Declared phony with ".PHONY:" (a "=" would only set a variable).
.PHONY: git-pr
git-pr:
	@./gitpr $(N)
# puf-files: aggregate target that brings all PUF-related made files up to
# date.  It has no recipe of its own; the listed files are built by their
# own rules.  Declared phony with ".PHONY:" (a "=" would only set a variable).
.PHONY: puf-files
puf-files: data/cps-matched-puf.csv \
           puf_stage1/growfactors.csv \
           puf_stage2/puf_weights.csv.gz \
           puf_stage3/puf_ratios.csv
# PM_DIR=./puf_data/StatMatch/Matching
# PM_PY_FILES := $(shell ls -l $(PM_DIR)/*py | awk '{print $$9}')
# data/cps-matched-puf.csv: $(PM_PY_FILES) \
# $(PM_DIR)/puf2011.csv \
# $(PM_DIR)/cpsmar2016.csv
# cd $(PM_DIR) ; python runmatch.py
# Build data/cps-matched-puf.csv by running createpuf.py in the directory
# make was started from.  The rule re-runs whenever createpuf.py or any of
# the listed taxdata/puf modules is newer than the target.
# The same run also writes data/puf.csv.
data/cps-matched-puf.csv: createpuf.py \
                          taxdata/puf/finalprep.py \
                          taxdata/puf/impute_itmexp.py \
                          taxdata/puf/impute_pencon.py
	python createpuf.py
# Build puf_stage1/Stage_I_factors.csv by running stage1.py inside
# puf_stage1.  "cd ... &&" is used so the script is never started from the
# wrong directory when the cd fails.
# The same run also writes puf_stage1/Stage_II_targets.csv, which other rules
# list as a prerequisite even though no rule names it as a target.
puf_stage1/Stage_I_factors.csv: puf_stage1/stage1.py \
                                puf_stage1/CBO_baseline.csv \
                                puf_stage1/IRS_return_projection.csv \
                                puf_stage1/NC-EST2014-AGESEX-RES.csv \
                                puf_stage1/NP2014_D1.csv \
                                puf_stage1/SOI_estimates.csv \
                                puf_stage1/US-EST00INT-ALLDATA.csv
	cd puf_stage1 && python stage1.py
# Build puf_stage1/growfactors.csv by running factors_finalprep.py inside
# puf_stage1.  "cd ... &&" keeps the script from running in the wrong
# directory if the cd fails.
puf_stage1/growfactors.csv: puf_stage1/factors_finalprep.py \
                            puf_stage1/Stage_I_factors.csv \
                            puf_stage1/benefit_growth_rates.csv
	cd puf_stage1 && python factors_finalprep.py
# Build puf_stage2/puf_weights.csv.gz by running stage2.py inside puf_stage2,
# then unzip and re-zip the result with "gzip -n" so the GZIP header carries
# no time-stamp and git reports the file's status from its contents alone.
# Every step is chained with "&&": a failed cd or a failed stage2.py stops
# the recipe instead of continuing in the wrong directory.
puf_stage2/puf_weights.csv.gz: puf_stage2/stage2.py \
                               puf_stage2/dataprep.py \
                               puf_stage2/solver.jl \
                               data/cps-matched-puf.csv \
                               puf_stage1/Stage_I_factors.csv \
                               puf_stage1/Stage_II_targets.csv
	cd puf_stage2 && python stage2.py && \
	gunzip puf_weights.csv.gz && gzip -n puf_weights.csv
# Build puf_stage3/puf_ratios.csv by running stage3.py inside puf_stage3.
# "cd ... &&" keeps the script from running in the wrong directory if the
# cd fails.
puf_stage3/puf_ratios.csv: puf_stage3/stage3.py \
                           puf_stage3/stage3_targets.csv \
                           data/cps-matched-puf.csv \
                           puf_stage1/growfactors.csv \
                           puf_stage2/puf_weights.csv.gz
	cd puf_stage3 && python stage3.py
# cps-files: aggregate target that brings all CPS-related made files up to
# date.  It has no recipe of its own; the listed files are built by their
# own rules.  Declared phony with ".PHONY:" (a "=" would only set a variable).
.PHONY: cps-files
cps-files: data/cps_raw.csv.gz \
           cps_stage1/stage_2_targets.csv \
           cps_stage2/cps_weights.csv.gz
# Build the CPS data file by running createcps.py in the directory make was
# started from, then unzip and re-zip data/cps.csv.gz with "gzip -n" so the
# GZIP header carries no time-stamp.
# All steps are chained with "&&": previously a failing createcps.py was
# followed by ";" and its exit status was lost, so make could treat a failed
# build as successful.
# createcps.py is listed as a prerequisite so that editing the driver script
# triggers a rebuild.
# NOTE(review): the recipe re-zips data/cps.csv.gz while the target is
# data/cps_raw.csv.gz -- confirm that createcps.py writes both files.
data/cps_raw.csv.gz: createcps.py \
                     taxdata/cps/create.py \
                     taxdata/cps/benefits.py \
                     taxdata/cps/filing_rules.json \
                     taxdata/cps/finalprep.py \
                     taxdata/cps/helpers.py \
                     taxdata/cps/impute.py \
                     taxdata/cps/pycps.py \
                     taxdata/cps/splitincome.py \
                     taxdata/cps/targeting.py \
                     taxdata/cps/taxunit.py \
                     taxdata/cps/transform_sas.py \
                     taxdata/cps/adjustment_targets.csv \
                     taxdata/cps/benefitprograms.csv
	python createcps.py && cd data && \
	gunzip cps.csv.gz && gzip -n cps.csv
# Build cps_stage1/stage_2_targets.csv by running stage1.py inside
# cps_stage1.  "cd ... &&" keeps the script from running in the wrong
# directory if the cd fails.
cps_stage1/stage_2_targets.csv: cps_stage1/stage1.py \
                                cps_stage1/SOI_estimates.csv \
                                puf_stage1/Stage_I_factors.csv \
                                puf_stage1/Stage_II_targets.csv
	cd cps_stage1 && python stage1.py
# Build cps_stage2/cps_weights.csv.gz by running stage2.py inside cps_stage2,
# then unzip and re-zip the result with "gzip -n" so the GZIP header carries
# no time-stamp and git reports the file's status from its contents alone.
# Every step is chained with "&&": a failed cd or a failed stage2.py stops
# the recipe instead of continuing in the wrong directory.
cps_stage2/cps_weights.csv.gz: cps_stage2/stage2.py \
                               cps_stage2/dataprep.py \
                               data/cps_raw.csv.gz \
                               puf_stage1/Stage_I_factors.csv \
                               cps_stage1/stage_2_targets.csv \
                               cps_stage2/solver.jl
	cd cps_stage2 && python stage2.py && \
	gunzip cps_weights.csv.gz && gzip -n cps_weights.csv
# all: build everything covered by the puf-files and cps-files targets.
# Declared phony with ".PHONY:" (a "=" would only set a variable).
.PHONY: all
all: puf-files cps-files