#!/usr/bin/env python
# Ultra-optimized Manifest writing.
# (c) 2017 Michał Górny
# Licensed under the terms of 2-clause BSD license
#
# Provenance: utils/gen_fast_manifest.py as added by commit
# a1cd256d0eb9b7b1fae9ac219e91ae2fd4e72430
# ("Add ultra-fast Manifest writing scripts", Michał Górny,
# Sun, 19 Nov 2017 12:45:00 +0100).

import errno
import glob
import gzip
import hashlib
import io
import os
import os.path
import sys

try:
    # BLAKE2 is part of hashlib since Python 3.6.
    from hashlib import blake2b as _blake2b
except ImportError:
    # Older interpreters: fall back to the third-party implementation.
    from pyblake2 import blake2b as _blake2b


# Read size used while hashing; large enough to keep call overhead
# negligible without holding a whole file in memory.
_CHUNK_SIZE = 1024 * 1024

# Manifest data longer than this (in bytes) is written gzip-compressed,
# unless the directory is handled in compat mode.
_COMPRESS_THRESHOLD = 4096

# Line prefixes of existing Manifest entries that are carried over.
_PRESERVED_PREFIXES = (b'DIST', b'IGNORE')

# File names left out of the Manifest when not in compat mode.
_TIMESTAMP_FILES = frozenset((
    'timestamp',
    'timestamp.chk',
    'timestamp.commit',
    'timestamp.x',
))


def get_manifest_entry(t, path, relpath):
    """Return one Manifest line (UTF-8 bytes, no newline) for a file.

    t is the entry type tag written first on the line, path is the
    file to read and relpath is the path recorded in the entry.  The
    line has the form ``<t> <relpath> <size> BLAKE2B <hex> SHA512 <hex>``.
    Errors from opening or reading the file propagate to the caller.
    """
    sha512 = hashlib.sha512()
    blake2 = _blake2b()
    size = 0

    with io.open(path, 'rb') as f:
        # Feed both digests chunk by chunk so that memory use does not
        # grow with the file size.
        for chunk in iter(lambda: f.read(_CHUNK_SIZE), b''):
            sha512.update(chunk)
            blake2.update(chunk)
            size += len(chunk)

    return ('{} {} {} BLAKE2B {} SHA512 {}'.format(
        t, relpath, size, blake2.hexdigest(),
        sha512.hexdigest())).encode('utf8')


def _classify(name, relpath, compat_mode):
    """Return (entry type, recorded path) for a file, or None to omit it."""
    if not compat_mode:
        if name in _TIMESTAMP_FILES:
            return None
        return 'DATA', relpath

    if name.endswith('.ebuild') and name != 'skel.ebuild':
        return 'EBUILD', relpath
    if name == 'metadata.xml':
        return 'MISC', relpath
    if relpath.startswith('files/'):
        # AUX entries are recorded relative to the files/ directory.
        return 'AUX', relpath[len('files/'):]
    return 'DATA', relpath


def generate_manifest_entries(out, topdir):
    """Append Manifest lines for the files below topdir to the list out.

    Compat mode is enabled when topdir itself contains a file ending in
    '.ebuild'; it changes how files are classified (see _classify).
    A subdirectory that contains a file whose name starts with
    'Manifest' contributes a single MANIFEST entry for that file and is
    not descended into.  Directories and files whose names start with
    '.' are skipped, as are files whose names start with 'Manifest'.

    Returns True if compat mode was enabled, False otherwise.
    """
    compat_mode = False

    for dirpath, dirs, files in os.walk(topdir):
        if dirpath == topdir:
            # enable compat mode for ebuild directories
            if any(f.endswith('.ebuild') for f in files):
                compat_mode = True
        else:
            sub_manifest = next(
                (f for f in files if f.startswith('Manifest')), None)
            if sub_manifest is not None:
                fp = os.path.join(dirpath, sub_manifest)
                out.append(get_manifest_entry(
                    'MANIFEST', fp, os.path.relpath(fp, topdir)))
                # do not descend: os.walk() honours in-place changes
                del dirs[:]
                continue

        # skip dot-dirs (in place, so that os.walk() does not enter them)
        dirs[:] = [d for d in dirs if not d.startswith('.')]

        for f in files:
            if f.startswith(('Manifest', '.')):
                continue
            fp = os.path.join(dirpath, f)
            classified = _classify(
                f, os.path.relpath(fp, topdir), compat_mode)
            if classified is None:
                continue
            ftype, ep = classified
            out.append(get_manifest_entry(ftype, fp, ep))

    return compat_mode


def _load_preserved_entries(plain_path, gz_path):
    """Return the DIST/IGNORE lines of the existing top-level Manifest.

    The uncompressed Manifest is preferred; the gzip-compressed one is
    consulted only when the former does not exist, so that entries
    survive a previous run that wrote Manifest.gz.  Returns an empty
    list when neither file exists.
    """
    for path, opener in ((plain_path, io.open), (gz_path, gzip.open)):
        try:
            with opener(path, 'rb') as f:
                return [line.rstrip() for line in f
                        if line.startswith(_PRESERVED_PREFIXES)]
        except OSError as e:
            if e.errno != errno.ENOENT:
                raise
    return []


def _remove_if_exists(path):
    """Unlink path, ignoring the case where it does not exist."""
    try:
        os.unlink(path)
    except OSError as e:
        if e.errno != errno.ENOENT:
            raise


def gen_manifest(top_dir):
    """(Re)write the top-level Manifest of top_dir.

    DIST and IGNORE lines of the existing Manifest are kept, entries
    for local files are regenerated, and all lines are written sorted.
    The result goes to 'Manifest.gz' when it exceeds 4096 bytes and
    compat mode is off, and to 'Manifest' otherwise; the other of the
    two files is removed so that only one top-level Manifest remains.
    """
    plain_path = os.path.join(top_dir, 'Manifest')
    gz_path = plain_path + '.gz'

    # load DIST and IGNORE entries from existing Manifest
    manifest_entries = _load_preserved_entries(plain_path, gz_path)

    # generate local file entries
    compat_mode = generate_manifest_entries(manifest_entries, top_dir)
    manifest_entries.sort()

    manifest_data = b'\n'.join(manifest_entries) + b'\n'
    if len(manifest_data) > _COMPRESS_THRESHOLD and not compat_mode:
        with gzip.GzipFile(gz_path, 'wb') as f:
            f.write(manifest_data)
        _remove_if_exists(plain_path)
    else:
        with io.open(plain_path, 'wb') as f:
            f.write(manifest_data)
        _remove_if_exists(gz_path)


def main(argv):
    """Regenerate the Manifest of every directory named in argv[1:].

    Returns the process exit status: 1 if no directory was given,
    0 otherwise.
    """
    if len(argv) < 2:
        # NOTE(review): a placeholder between '{}' and '...' may have
        # been lost in extraction; the message is kept as found.
        print('Usage: {} ...'.format(argv[0]))
        return 1

    for path in argv[1:]:
        gen_manifest(path)
    return 0


if __name__ == '__main__':
    sys.exit(main(sys.argv))