Skip to content

Commit c196e8e

Browse files
authored
Better checksum calculation (aio-libs#5183)
1 parent 46d2ed9 commit c196e8e

File tree

5 files changed

+102
-49
lines changed

5 files changed

+102
-49
lines changed

.github/workflows/ci.yml

+1-26
Original file line numberDiff line numberDiff line change
@@ -115,27 +115,16 @@ jobs:
115115
path: ${{ steps.pip-cache.outputs.dir }}
116116
restore-keys: |
117117
pip-ci-${{ runner.os }}-${{ matrix.pyver }}-{{ matrix.no-extensions }}-
118-
- name: Install cython
119-
if: ${{ matrix.no-extensions == '' }}
120-
uses: py-actions/py-dependency-install@v2
121-
with:
122-
path: requirements/cython.txt
123118
- name: Cythonize
124119
if: ${{ matrix.no-extensions == '' }}
125120
run: |
126121
make cythonize
127-
- name: Install dependencies
128-
uses: py-actions/py-dependency-install@v2
129-
with:
130-
path: requirements/test.txt
131-
env:
132-
AIOHTTP_NO_EXTENSIONS: ${{ matrix.no-extensions }}
133122
- name: Run unittests
134123
env:
135124
COLOR: 'yes'
136125
AIOHTTP_NO_EXTENSIONS: ${{ matrix.no-extensions }}
137126
run: |
138-
python -m pytest tests -vv
127+
make vvtest
139128
python -m coverage xml
140129
- name: Upload coverage
141130
uses: codecov/codecov-action@v1
@@ -168,10 +157,6 @@ jobs:
168157
uses: actions/setup-python@v2
169158
with:
170159
python-version: 3.8
171-
- name: Install cython
172-
uses: py-actions/py-dependency-install@v2
173-
with:
174-
path: requirements/cython.txt
175160
- name: Cythonize
176161
run: |
177162
make cythonize
@@ -210,11 +195,6 @@ jobs:
210195
uses: actions/setup-python@v2
211196
with:
212197
python-version: 3.8
213-
- name: Install cython
214-
if: ${{ matrix.no-extensions == '' }}
215-
uses: py-actions/py-dependency-install@v2
216-
with:
217-
path: requirements/cython.txt
218198
- name: Cythonize
219199
if: ${{ matrix.no-extensions == '' }}
220200
run: |
@@ -255,11 +235,6 @@ jobs:
255235
uses: actions/setup-python@v2
256236
with:
257237
python-version: ${{ matrix.pyver }}
258-
- name: Install cython
259-
if: ${{ matrix.no-extensions == '' }}
260-
uses: py-actions/py-dependency-install@v2
261-
with:
262-
path: requirements/cython.txt
263238
- name: Cythonize
264239
if: ${{ matrix.no-extensions == '' }}
265240
run: |

.gitignore

+1
Original file line numberDiff line numberDiff line change
@@ -20,6 +20,7 @@
2020
.envrc
2121
.flake
2222
.gitconfig
23+
.hash
2324
.idea
2425
.install-cython
2526
.install-deps

Makefile

+49-22
Original file line numberDiff line numberDiff line change
@@ -1,47 +1,67 @@
11
# Some simple testing tasks (sorry, UNIX only).
22

3-
to-md5 = $1 $(addsuffix .md5,$1)
3+
to-hash-one = $(dir $1).hash/$(addsuffix .hash,$(notdir $1))
4+
to-hash = $(foreach fname,$1,$(call to-hash-one,$(fname)))
45

5-
CYS = $(wildcard aiohttp/*.pyx) $(wildcard aiohttp/*.pyi) $(wildcard aiohttp/*.pxd)
6-
PYXS = $(wildcard aiohttp/*.pyx)
7-
CS = $(wildcard aiohttp/*.c)
8-
PYS = $(wildcard aiohttp/*.py)
9-
REQS = $(wildcard requirements/*.txt)
10-
SRC = aiohttp examples tests setup.py
6+
CYS := $(wildcard aiohttp/*.pyx) $(wildcard aiohttp/*.pyi) $(wildcard aiohttp/*.pxd)
7+
PYXS := $(wildcard aiohttp/*.pyx)
8+
CS := $(wildcard aiohttp/*.c)
9+
PYS := $(wildcard aiohttp/*.py)
10+
REQS := $(wildcard requirements/*.txt)
11+
ALLS := $(sort $(CYS) $(CS) $(PYS) $(REQS))
1112

1213
.PHONY: all
1314
all: test
1415

15-
# Recipe from https://www.cmcrossroads.com/article/rebuilding-when-files-checksum-changes
16-
%.md5: FORCE
17-
@$(if $(filter-out $(shell cat $@ 2>/dev/null),$(shell md5sum $*)),md5sum $* > $@)
16+
tst:
17+
@echo $(call to-hash,requirements/cython.txt)
18+
@echo $(call to-hash,aiohttp/%.pyx)
19+
1820

21+
# Recipe from https://www.cmcrossroads.com/article/rebuilding-when-files-checksum-changes
1922
FORCE:
2023

24+
# check_sum.py works perfectly fine but slow when called for every file from $(ALLS)
25+
# (perhaps even several times for each file).
26+
# That is why much less readable but faster solution exists
27+
ifneq (, $(shell which sha256sum))
28+
%.hash: FORCE
29+
$(eval $@_ABS := $(abspath $@))
30+
$(eval $@_NAME := $($@_ABS))
31+
$(eval $@_HASHDIR := $(dir $($@_ABS)))
32+
$(eval $@_TMP := $($@_HASHDIR)../$(notdir $($@_ABS)))
33+
$(eval $@_ORIG := $(subst /.hash/../,/,$(basename $($@_TMP))))
34+
@#echo ==== $($@_ABS) $($@_HASHDIR) $($@_NAME) $($@_TMP) $($@_ORIG)
35+
@if ! (sha256sum --check $($@_ABS) 1>/dev/null 2>/dev/null); then \
36+
mkdir -p $($@_HASHDIR); \
37+
echo re-hash $($@_ORIG); \
38+
sha256sum $($@_ORIG) > $($@_ABS); \
39+
fi
40+
else
41+
%.hash: FORCE
42+
@./tools/check_sum.py $@ # --debug
43+
endif
44+
2145
# Enumerate intermediate files to don't remove them automatically.
22-
# The target must exist, no need to execute it.
23-
.PHONY: _keep-intermediate-files
24-
_keep-intermediate-files: $(addsuffix .md5,$(CYS))\
25-
$(addsuffix .md5,$(CS))\
26-
$(addsuffix .md5,$(PYS))\
27-
$(addsuffix .md5,$(REQS))
28-
29-
.install-cython: $(call to-md5,requirements/cython.txt)
46+
.SECONDARY: $(call to-hash,$(ALLS))
47+
48+
49+
.install-cython: $(call to-hash,requirements/cython.txt)
3050
pip install -r requirements/cython.txt
3151
@touch .install-cython
3252

33-
aiohttp/_find_header.c: $(call to-md5,aiohttp/hdrs.py)
53+
aiohttp/_find_header.c: $(call to-hash,aiohttp/hdrs.py ./tools/gen.py)
3454
./tools/gen.py
3555

3656
# _find_headers generator creates _headers.pyi as well
37-
aiohttp/%.c: $(call to-md5,aiohttp/%.pyx) aiohttp/_find_header.c
57+
aiohttp/%.c: aiohttp/%.pyx $(call to-hash,$(CYS)) aiohttp/_find_header.c
3858
cython -3 -o $@ $< -I aiohttp
3959

4060

4161
.PHONY: cythonize
4262
cythonize: .install-cython $(PYXS:.pyx=.c)
4363

44-
.install-deps: .install-cython $(PYXS:.pyx=.c) $(call to-md5,$(CYS) $(REQS))
64+
.install-deps: .install-cython $(PYXS:.pyx=.c) $(call to-hash,$(CYS) $(REQS))
4565
pip install -r requirements/dev.txt
4666
@touch .install-deps
4767

@@ -56,7 +76,7 @@ fmt format:
5676
mypy:
5777
mypy aiohttp
5878

59-
.develop: .install-deps $(call to-md5,$(PYS) $(CYS) $(CS))
79+
.develop: .install-deps $(call to-hash,$(PYS) $(CYS) $(CS))
6080
pip install -e .
6181
@touch .develop
6282

@@ -68,16 +88,23 @@ test: .develop
6888
vtest: .develop
6989
@pytest -s -v
7090

91+
.PHONY: vvtest
92+
vvtest: .develop
93+
@pytest -vv
94+
7195
.PHONY: clean
7296
clean:
7397
@rm -rf `find . -name __pycache__`
98+
@rm -rf `find . -name .hash`
99+
@rm -rf `find . -name .md5` # old styling
74100
@rm -f `find . -type f -name '*.py[co]' `
75101
@rm -f `find . -type f -name '*~' `
76102
@rm -f `find . -type f -name '.*~' `
77103
@rm -f `find . -type f -name '@*' `
78104
@rm -f `find . -type f -name '#*#' `
79105
@rm -f `find . -type f -name '*.orig' `
80106
@rm -f `find . -type f -name '*.rej' `
107+
@rm -f `find . -type f -name '*.md5' ` # old styling
81108
@rm -f .coverage
82109
@rm -rf htmlcov
83110
@rm -rf build

requirements/lint.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
black==20.8b1; python_version >= "3.6"
1+
black==20.8b1; implementation_name=="cpython"
22
flake8==3.8.4
33
flake8-pyi==20.10.0
44
isort==5.6.4

tools/check_sum.py

+50
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,50 @@
1+
#!/usr/bin/env python
2+
3+
import argparse
4+
import hashlib
5+
import pathlib
6+
import sys
7+
8+
PARSER = argparse.ArgumentParser(
9+
description="Helper for check file hashes in Makefile instead of bare timestamps"
10+
)
11+
PARSER.add_argument("dst", metavar="DST", type=pathlib.Path)
12+
PARSER.add_argument("-d", "--debug", action="store_true", default=False)
13+
14+
15+
def main(argv):
16+
args = PARSER.parse_args(argv)
17+
dst = args.dst
18+
assert dst.suffix == ".hash"
19+
dirname = dst.parent
20+
if dirname.name != ".hash":
21+
if args.debug:
22+
print(f"Invalid name {dst} -> dirname {dirname}", file=sys.stderr)
23+
return 0
24+
dirname.mkdir(exist_ok=True)
25+
src_dir = dirname.parent
26+
src_name = dst.stem # drop .hash
27+
full_src = src_dir / src_name
28+
hasher = hashlib.sha256()
29+
try:
30+
hasher.update(full_src.read_bytes())
31+
except OSError:
32+
if args.debug:
33+
print(f"Cannot open {full_src}", file=sys.stderr)
34+
return 0
35+
src_hash = hasher.hexdigest()
36+
if dst.exists():
37+
dst_hash = dst.read_text()
38+
else:
39+
dst_hash = ""
40+
if src_hash != dst_hash:
41+
dst.write_text(src_hash)
42+
print(f"re-hash {src_hash}")
43+
else:
44+
if args.debug:
45+
print(f"Skip {src_hash} checksum, up-to-date")
46+
return 0
47+
48+
49+
if __name__ == "__main__":
50+
sys.exit(main(sys.argv[1:]))

0 commit comments

Comments
 (0)