forked from acl-org/acl-anthology
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathMakefile
240 lines (198 loc) · 7.62 KB
/
Makefile
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
# -*- coding: utf-8 -*-
#
# Copyright 2019 Arne Köhn <[email protected]>
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# Instructions:
# - if you edit the a command running python, make sure to
# run . $(VENV) && python3 -- this sets up the virtual environment.
# - all targets running python somewhere should have venv as a dependency.
# this makes sure that all required packages are installed.
SHELL = /bin/sh
ANTHOLOGYHOST := "https://www.aclweb.org"
ANTHOLOGYDIR := anthology
HUGO_ENV ?= production
sourcefiles=$(shell find data -type f '(' -name "*.yaml" -o -name "*.xml" ')')
xmlstaged=$(shell git diff --staged --name-only --diff-filter=d data/xml/*.xml)
pysources=$(shell git ls-files | egrep "\.pyi?$$")
pystaged=$(shell git diff --staged --name-only --diff-filter=d | egrep "\.pyi?$$")
timestamp=$(shell date -u +"%d %B %Y at %H:%M %Z")
githash=$(shell git rev-parse HEAD)
githashshort=$(shell git rev-parse --short HEAD)
#######################################################
# check whether the correct python version is available
ifeq (, $(shell which python3 ))
$(error "python3 not found in $(PATH)")
endif
PYTHON_VERSION_MIN=3.7
PYTHON_VERSION=$(shell python3 -c 'import sys; print("%d.%d"% sys.version_info[0:2])' )
PYTHON_VERSION_OK=$(shell python3 -c 'import sys; print(int(float("%d.%d"% sys.version_info[0:2]) >= $(PYTHON_VERSION_MIN)))' )
ifeq ($(PYTHON_VERSION_OK),0)
$(error "Need python $(PYTHON_VERSION_MIN), but only found python $(PYTHON_VERSION)!")
endif
# end python check
#######################################################
# hugo version check
HUGO_VERSION_MIN=58
HUGO_VERSION=$(shell hugo version | sed 's/.*Generator v0.\(..\).*/\1/')
HUGO_VERSION_TOO_LOW:=$(shell [ $(HUGO_VERSION_MIN) -gt $(HUGO_VERSION) ] && echo true)
ifeq ($(HUGO_VERSION_TOO_LOW),true)
$(error "incorrect hugo version installed! Need hugo 0.$(HUGO_VERSION_MIN), but only found hugo 0.$(HUGO_VERSION)!")
endif
VENV := "venv/bin/activate"
.PHONY: site
site: bibtex mods endnote hugo sitemap
# Split the file sitemap into Google-ingestible chunks.
# Also build the PDF sitemap, and split it.
.PHONY: sitemap
sitemap: build/.sitemap
build/.sitemap: venv/bin/activate build/.hugo
. $(VENV) && python3 bin/split_sitemap.py build/anthology/sitemap.xml
@rm -f build/anthology/sitemap_*.xml.gz
@gzip -9n build/anthology/sitemap_*.xml
@bin/create_sitemapindex.sh `ls build/anthology/ | grep 'sitemap_.*xml.gz'` > build/anthology/sitemapindex.xml
@touch build/.sitemap
.PHONY: venv
venv: venv/bin/activate
# installs dependencies if requirements.txt have been updated.
# checks whether libyaml is enabled to ensure fast build times.
venv/bin/activate: bin/requirements.txt
test -d venv || python3 -m venv venv
. $(VENV) && pip3 install -Ur bin/requirements.txt
@python3 -c "from yaml import CLoader" 2> /dev/null || ( \
echo "WARNING No libyaml bindings enabled for pyyaml, your build will be several times slower than needed";\
echo " see the README on GitHub for more information")
touch venv/bin/activate
.PHONY: all
all: clean check site
.PHONY: basedirs
basedirs:
build/.basedirs
build/.basedirs:
@mkdir -p build/data-export
@mkdir -p build/content/papers
@touch build/.basedirs
# copies all files that are not automatically generated
# and creates empty directories as needed.
.PHONY: static
static: build/.static
build/.static: build/.basedirs $(shell find hugo -type f)
@echo "INFO Creating and populating build directory..."
@cp -r hugo/* build
@echo >> build/config.toml
@echo "[params]" >> build/config.toml
@echo " githash = \"${githash}\"" >> build/config.toml
@echo " githashshort = \"${githashshort}\"" >> build/config.toml
@echo " timestamp = \"${timestamp}\"" >> build/config.toml
@perl -pi -e "s/ANTHOLOGYDIR/$(ANTHOLOGYDIR)/g" build/index.html
@touch build/.static
.PHONY: yaml
yaml: build/.yaml
build/.yaml: build/.basedirs $(sourcefiles) venv/bin/activate
@echo "INFO Generating YAML files for Hugo..."
. $(VENV) && python3 bin/create_hugo_yaml.py --clean
@touch build/.yaml
.PHONY: hugo_pages
hugo_pages: build/.pages
build/.pages: build/.basedirs build/.yaml venv/bin/activate
@echo "INFO Creating page templates for Hugo..."
. $(VENV) && python3 bin/create_hugo_pages.py --clean
@touch build/.pages
.PHONY: bibtex
bibtex: build/.bibtex
build/.bibtex: build/.basedirs $(sourcefiles) venv/bin/activate
@echo "INFO Creating BibTeX files..."
. $(VENV) && python3 bin/create_bibtex.py --clean
@touch build/.bibtex
.PHONY: mods
mods: build/.mods
build/.mods: build/.bibtex
@echo "INFO Converting BibTeX files to MODS XML..."
@find build/data-export -name '*.bib' -print0 | \
xargs -0 -n 1 -P 8 bin/bib2xml_wrapper >/dev/null
@touch build/.mods
.PHONY: endnote
endnote: build/.endnote
build/.endnote: build/.mods
@echo "INFO Converting MODS XML files to EndNote..."
@find build/data-export -name '*.xml' -print0 | \
xargs -0 -n 1 -P 8 bin/xml2end_wrapper >/dev/null
@touch build/.endnote
%.endf: %.xml
xml2end $< 2>&1 > $@
.PHONY: hugo
hugo: build/.hugo
build/.hugo: build/.static build/.pages build/.bibtex build/.mods build/.endnote
@echo "INFO Running Hugo... this may take a while."
@cd build && \
hugo -b $(ANTHOLOGYHOST)/$(ANTHOLOGYDIR) \
-d $(ANTHOLOGYDIR) \
-e $(HUGO_ENV) \
--cleanDestinationDir \
--minify
@touch build/.hugo
.PHONY: test
test: hugo
diff -u build/anthology/P19-1007.bib test/data/P19-1007.bib
diff -u build/anthology/P19-1007.xml test/data/P19-1007.xml
.PHONY: clean
clean:
rm -rf build
.PHONY: check
check: venv
@if grep -rl ' ' data/xml; then \
echo "check error: found a tab character in the above XML files!"; \
exit 1; \
fi
jing -c data/xml/schema.rnc data/xml/*xml
SKIP=no-commit-to-branch . $(VENV) \
&& pre-commit run --all-files \
&& black --check $(pysources)
.PHONY: check_staged_xml
check_staged_xml:
@if [ ! -z "$(xmlstaged)" ]; then \
jing -c data/xml/schema.rnc $(xmlstaged) ;\
fi
.PHONY: check_commit
check_commit: check_staged_xml venv
@. $(VENV) && pre-commit run
@if [ ! -z "$(pystaged)" ]; then \
. $(VENV) && black --check $(pystaged) ;\
fi
.PHONY: autofix
autofix: check_staged_xml venv
@. $(VENV) && \
EXIT_STATUS=0 ;\
pre-commit run || EXIT_STATUS=$$? ;\
PRE_DIFF=`git diff --no-ext-diff --no-color` ;\
black $(pysources) || EXIT_STATUS=$$? ;\
POST_DIFF=`git diff --no-ext-diff --no-color` ;\
[ "$${PRE_DIFF}" = "$${POST_DIFF}" ] || EXIT_STATUS=1 ;\
[ $${EXIT_STATUS} -eq 0 ]
.PHONY: serve
serve:
@echo "INFO Starting a server at http://localhost:8000/"
@cd build && python3 -m http.server 8000
# this target does not use ANTHOLOGYDIR because the official website
# only works if ANTHOLOGYDIR == anthology.
.PHONY: upload
upload:
@if [[ $(ANTHOLOGYDIR) != "anthology" ]]; then \
echo "WARNING: Can't upload because ANTHOLOGYDIR was set to '$(ANTHOLOGYDIR)' instead of 'anthology'"; \
exit 1; \
fi
@echo "INFO Running rsync..."
# main site
@rsync -azve ssh --delete build/anthology/ [email protected]:anthology-static
# aclanthology.org
# @rsync -azve ssh --delete build/anthology/ [email protected]:/var/www/html