mirror of
https://github.com/deepset-ai/haystack.git
synced 2025-06-26 22:00:13 +00:00
50 lines
1.5 KiB
Python
50 lines
1.5 KiB
Python
from pathlib import Path
|
|
from typing import Iterator
|
|
|
|
import ast
|
|
import hashlib
|
|
|
|
|
|
def docstrings_checksum(python_files: Iterator[Path]):
|
|
files_content = (f.read_text() for f in python_files)
|
|
trees = (ast.parse(c) for c in files_content)
|
|
|
|
# Get all docstrings from async functions, functions,
|
|
# classes and modules definitions
|
|
docstrings = []
|
|
for tree in trees:
|
|
for node in ast.walk(tree):
|
|
if not isinstance(node, (ast.AsyncFunctionDef, ast.FunctionDef, ast.ClassDef, ast.Module)):
|
|
# Skip all node types that can't have docstrings to prevent failures
|
|
continue
|
|
docstring = ast.get_docstring(node)
|
|
if docstring:
|
|
docstrings.append(docstring)
|
|
|
|
# Sort them to be safe, since ast.walk() returns
|
|
# nodes in no specified order.
|
|
# See https://docs.python.org/3/library/ast.html#ast.walk
|
|
docstrings.sort()
|
|
|
|
return hashlib.md5(str(docstrings).encode("utf-8")).hexdigest()
|
|
|
|
|
|
if __name__ == "__main__":
|
|
import argparse
|
|
|
|
parser = argparse.ArgumentParser()
|
|
parser.add_argument("--root", help="Haystack root folder", required=True, type=Path)
|
|
args = parser.parse_args()
|
|
|
|
# Get all Haystack and rest_api python files
|
|
root: Path = args.root.absolute()
|
|
haystack_files = root.glob("haystack/**/*.py")
|
|
rest_api_files = root.glob("rest_api/**/*.py")
|
|
|
|
import itertools
|
|
|
|
python_files = itertools.chain(haystack_files, rest_api_files)
|
|
|
|
md5 = docstrings_checksum(python_files)
|
|
print(md5)
|