utils: add a method to calculate the hash of a directory

Signed-off-by:  Eric Callahan <arksine.code@gmail.com>
This commit is contained in:
Eric Callahan 2021-06-18 19:11:09 -04:00
parent 5379e4b4bd
commit ebaac290e7
1 changed files with 27 additions and 0 deletions

View File

@ -11,10 +11,12 @@ import os
import sys import sys
import subprocess import subprocess
import asyncio import asyncio
import hashlib
from queue import SimpleQueue as Queue from queue import SimpleQueue as Queue
# Annotation imports # Annotation imports
from typing import ( from typing import (
List,
Optional, Optional,
ClassVar, ClassVar,
Tuple, Tuple,
@ -122,3 +124,28 @@ def setup_logging(log_file: str,
queue, stdout_hdlr) queue, stdout_hdlr)
listener.start() listener.start()
return listener, file_hdlr return listener, file_hdlr
def hash_directory(dir_path: str,
ignore_exts: List[str],
ignore_dirs: List[str]
) -> str:
checksum = hashlib.blake2s()
if not os.path.exists(dir_path):
return ""
for dpath, dnames, fnames in os.walk(dir_path):
valid_dirs: List[str] = []
for dname in sorted(dnames):
if dname[0] == '.' or dname in ignore_dirs:
continue
valid_dirs.append(dname)
dnames[:] = valid_dirs
for fname in sorted(fnames):
ext = os.path.splitext(fname)[-1].lower()
if fname[0] == '.' or ext in ignore_exts:
continue
fpath = pathlib.Path(os.path.join(dpath, fname))
try:
checksum.update(fpath.read_bytes())
except Exception:
pass
return checksum.hexdigest()