diff options
Diffstat (limited to 'json4cpp/docs/mkdocs/scripts/check_structure.py')
| -rwxr-xr-x | json4cpp/docs/mkdocs/scripts/check_structure.py | 222 |
1 files changed, 222 insertions, 0 deletions
diff --git a/json4cpp/docs/mkdocs/scripts/check_structure.py b/json4cpp/docs/mkdocs/scripts/check_structure.py new file mode 100755 index 0000000000..c8d637d06b --- /dev/null +++ b/json4cpp/docs/mkdocs/scripts/check_structure.py @@ -0,0 +1,222 @@ +#!/usr/bin/env python + +import glob +import os.path +import re +import sys + +import yaml + +warnings = 0 + + +def report(rule, location, description) -> None: + global warnings + warnings += 1 + print(f'{warnings:3}. {location}: {description} [{rule}]') + + +def check_structure() -> None: + expected_sections = [ + "Template parameters", + "Specializations", + "Iterator invalidation", + "Requirements", + "Member types", + "Member functions", + "Member variables", + "Static functions", + "Non-member functions", + "Literals", + "Helper classes", + "Parameters", + "Return value", + "Exception safety", + "Exceptions", + "Complexity", + "Possible implementation", + "Default definition", + "Notes", + "Examples", + "See also", + "Version history", + ] + + required_sections = [ + "Examples", + "Version history", + ] + + files = sorted(glob.glob("api/**/*.md", recursive=True)) + for file in files: + with open(file) as file_content: + section_idx = -1 # the index of the current h2 section + existing_sections = [] # the list of h2 sections in the file + in_initial_code_example = False # whether we are inside the first code example block + previous_line = None # the previous read line + h1sections = 0 # the number of h1 sections in the file + last_overload = 0 # the last seen overload number in the code example + documented_overloads = {} # the overloads that have been documented in the current block + current_section = None # the name of the current section + + for lineno, original_line in enumerate(file_content.readlines()): + line = original_line.strip() + + if line.startswith("# "): + h1sections += 1 + + # there should only be one top-level title + if h1sections > 1: + report("structure/unexpected_section", f"{file}:{lineno+1}", f'unexpected top-level title "{line}"') + h1sections = 1 + + # Overview pages should have a better title + if line == "# Overview": + report("style/title", f"{file}:{lineno+1}", 'overview pages should have a better title than "Overview"') + + # lines longer than 160 characters are bad (unless they are tables) + if len(line) > 160 and "|" not in line: + report("whitespace/line_length", f"{file}:{lineno+1} ({current_section})", f"line is too long ({len(line)} vs. 160 chars)") + + # sections in `<!-- NOLINT -->` comments are treated as present + if line.startswith("<!-- NOLINT"): + current_section = line.strip("<!-- NOLINT") + current_section = current_section.strip(" -->") + existing_sections.append(current_section) + + # check if sections are correct + if line.startswith("## "): + # before starting a new section, check if the previous one documented all overloads + if current_section in documented_overloads and last_overload != 0: + if len(documented_overloads[current_section]) > 0 and len(documented_overloads[current_section]) != last_overload: + expected = list(range(1, last_overload+1)) + undocumented = [x for x in expected if x not in documented_overloads[current_section]] + unexpected = [x for x in documented_overloads[current_section] if x not in expected] + if len(undocumented): + report("style/numbering", f"{file}:{lineno} ({current_section})", f'undocumented overloads: {", ".join([f"({x})" for x in undocumented])}') + if len(unexpected): + report("style/numbering", f"{file}:{lineno} ({current_section})", f'unexpected overloads: {", ".join([f"({x})" for x in unexpected])}') + + current_section = line.strip("## ") + existing_sections.append(current_section) + + if current_section in expected_sections: + idx = expected_sections.index(current_section) + if idx <= section_idx: + report("structure/section_order", f"{file}:{lineno+1}", f'section "{current_section}" is in an unexpected order (should be before "{expected_sections[section_idx]}")') + section_idx = idx + elif "index.md" not in file: # index.md files may have a different structure + report("structure/unknown_section", f"{file}:{lineno+1}", f'section "{current_section}" is not part of the expected sections') + + # collect the numbered items of the current section to later check if they match the number of overloads + if last_overload != 0 and not in_initial_code_example: + if len(original_line) and original_line[0].isdigit(): + number = int(re.findall(r"^(\d+).", original_line)[0]) + if current_section not in documented_overloads: + documented_overloads[current_section] = [] + documented_overloads[current_section].append(number) + + # code example + if line == "```cpp" and section_idx == -1: + in_initial_code_example = True + + if in_initial_code_example and line.startswith("//") and line not in ["// since C++20", "// until C++20"]: + # check numbering of overloads + if any(map(str.isdigit, line)): + number = int(re.findall(r"\d+", line)[0]) + if number != last_overload + 1: + report("style/numbering", f"{file}:{lineno+1}", f"expected number ({number}) to be ({last_overload +1 })") + last_overload = number + + if any(map(str.isdigit, line)) and "(" not in line: + report("style/numbering", f"{file}:{lineno+1}", f"number should be in parentheses: {line}") + + if line == "```" and in_initial_code_example: + in_initial_code_example = False + + # consecutive blank lines are bad + if line == "" and previous_line == "": + report("whitespace/blank_lines", f"{file}:{lineno}-{lineno+1} ({current_section})", "consecutive blank lines") + + # check that non-example admonitions have titles + untitled_admonition = re.match(r"^(\?\?\?|!!!) ([^ ]+)$", line) + if untitled_admonition and untitled_admonition.group(2) != "example": + report("style/admonition_title", f"{file}:{lineno} ({current_section})", f'"{untitled_admonition.group(2)}" admonitions should have a title') + + previous_line = line + + if "index.md" not in file: # index.md files may have a different structure + for required_section in required_sections: + if required_section not in existing_sections: + report("structure/missing_section", f"{file}:{lineno+1}", f'required section "{required_section}" was not found') + + +def check_examples() -> None: + example_files = sorted(glob.glob("../../examples/*.cpp")) + markdown_files = sorted(glob.glob("**/*.md", recursive=True)) + + # check if every example file is used in at least one markdown file + for example_file in example_files: + example_file = os.path.join("examples", os.path.basename(example_file)) + + found = False + for markdown_file in markdown_files: + content = " ".join(open(markdown_file).readlines()) + if example_file in content: + found = True + break + + if not found: + report("examples/missing", f"{example_file}", "example file is not used in any documentation file") + + +def check_links() -> None: + """Check that every entry in the navigation (nav in mkdocs.yml) links to at most one file. If a file is linked more + than once, then the first entry is repeated. See https://github.com/nlohmann/json/issues/4564 for the issue in + this project and https://github.com/mkdocs/mkdocs/issues/3428 for the root cause. + + The issue can be fixed by merging the keys, so + + - 'NLOHMANN_JSON_VERSION_MAJOR': api/macros/nlohmann_json_version_major.md + - 'NLOHMANN_JSON_VERSION_MINOR': api/macros/nlohmann_json_version_major.md + + would be replaced with + + - 'NLOHMANN_JSON_VERSION_MAJOR, NLOHMANN_JSON_VERSION_MINOR': api/macros/nlohmann_json_version_major.md + """ + file_with_path = {} + + def collect_links(node, path="") -> None: + if isinstance(node, list): + for x in node: + collect_links(x, path) + elif isinstance(node, dict): + for p, x in node.items(): + collect_links(x, path + "/" + p) + else: + if node not in file_with_path: + file_with_path[node] = [] + file_with_path[node].append(path) + + with open("../mkdocs.yml") as mkdocs_file: + # see https://github.com/yaml/pyyaml/issues/86#issuecomment-1042485535 + yaml.add_multi_constructor("tag:yaml.org,2002:python/name", lambda loader, suffix, node: None, Loader=yaml.SafeLoader) + yaml.add_multi_constructor("!ENV", lambda loader, suffix, node: None, Loader=yaml.SafeLoader) + y = yaml.safe_load(mkdocs_file) + + collect_links(y["nav"]) + for duplicate_file in [x for x in file_with_path if len(file_with_path[x]) > 1]: + file_list = [f'"{x}"' for x in file_with_path[duplicate_file]] + file_list_str = ", ".join(file_list) + report("nav/duplicate_files", "mkdocs.yml", f'file "{duplicate_file}" is linked with multiple keys in "nav": {file_list_str}; only one is rendered properly, see #4564') + + +if __name__ == "__main__": + print(120 * "-") + check_structure() + check_examples() + check_links() + print(120 * "-") + + if warnings > 0: + sys.exit(1) |
