3@file audit_function_docs.py
4@brief Audits C and Python function documentation coverage across the repository.
6This script enforces the repository's function-level documentation contract for:
8- public C declarations in `include/`,
9- C definitions in `src/` and `tests/c/`,
10- Python functions in `scripts/`, `tests/`, and Python-backed executable scripts.
12It is intentionally lightweight. The C side uses signature scanning instead of a
13full parser, while the Python side uses `ast`.
16from __future__
import annotations
21from dataclasses
import dataclass
22from pathlib
import Path
25REPO_ROOT = Path(__file__).resolve().parents[1]
27C_HEADER_DIRS = (REPO_ROOT /
"include",)
28C_SOURCE_DIRS = (REPO_ROOT /
"src", REPO_ROOT /
"tests" /
"c")
29PYTHON_DIRS = (REPO_ROOT /
"scripts", REPO_ROOT /
"tests")
31 REPO_ROOT /
"scripts" /
"picurv",
32 REPO_ROOT /
"scripts" /
"grid.gen",
35C_DECL_START_RE = re.compile(
36 r"^\s*(?!typedef\b)(?!if\b)(?!for\b)(?!while\b)(?!switch\b)(?!return\b)(?!else\b)"
37 r"(?:extern\s+)?(?:static\s+)?(?:inline\s+)?(?:const\s+)?(?:unsigned\s+|signed\s+)?"
38 r"(?:[A-Za-z_][A-Za-z0-9_]*\s+)+(?:\*\s*)*"
39 r"([A-Za-z_][A-Za-z0-9_]*)\s*\("
41C_PARAM_RE = re.compile(
r"@param(?:\[[^\]]+\])?\s+([A-Za-z_][A-Za-z0-9_]*)")
44@dataclass(frozen=True)
47 @brief Represents one audit failure.
48 @param[in] path Repository-relative path containing the failure.
49 @param[in] line 1-based source line associated with the failure.
50 @param[in] symbol Function symbol being audited.
51 @param[in] message Human-readable failure description.
62 @brief Returns all C or header files below the configured directories.
63 @param[in] directories Root directories to scan.
64 @return Sorted list of matching file paths.
67 files: list[Path] = []
68 for directory
in directories:
69 if not directory.exists():
71 files.extend(sorted(path
for path
in directory.rglob(
"*")
if path.suffix
in {
".c",
".h"}))
77 @brief Returns all Python source files covered by the audit.
78 @return Sorted list of Python-backed source files.
81 files: set[Path] = set()
82 for directory
in PYTHON_DIRS:
83 if not directory.exists():
85 files.update(path
for path
in directory.rglob(
"*.py"))
87 for path
in PYTHON_EXTRA_FILES:
96 @brief Reads a text file into a list of lines.
97 @param[in] path Path to read.
98 @return File contents split into lines without trailing newline markers.
101 return path.read_text(encoding=
"utf-8", errors=
"ignore").splitlines()
106 @brief Returns a repository-relative path string.
107 @param[in] path Absolute or repository-local path.
108 @return POSIX-style repository-relative path.
111 return path.relative_to(REPO_ROOT).as_posix()
116 @brief Finds the Doxygen block immediately attached to a declaration or definition.
117 @param[in] lines File content lines.
118 @param[in] start_line 0-based line index where the symbol begins.
119 @return `(start, end)` line indices for the attached block, or `None`.
122 probe = start_line - 1
123 while probe >= 0
and lines[probe].strip() ==
"":
126 if probe < 0
or "*/" not in lines[probe]:
130 while probe >= 0
and "/**" not in lines[probe]:
141 @brief Splits a C signature parameter list into parameter names.
142 @param[in] signature Full function signature text.
143 @return Ordered list of parameter names excluding `void` and variadics.
146 start = signature.find(
"(")
147 end = signature.rfind(
")")
148 if start < 0
or end < 0
or end <= start:
151 raw = signature[start + 1:end]
152 params: list[str] = []
154 current: list[str] = []
156 if char ==
"," and depth == 0:
157 params.append(
"".join(current).strip())
166 params.append(
"".join(current).strip())
168 names: list[str] = []
170 if not param
or param ==
"void" or param ==
"...":
173 clean = re.sub(
r"\b(const|volatile|restrict|extern|static|register|inline)\b",
"", param)
174 clean = clean.strip()
175 match = re.search(
r"([A-Za-z_][A-Za-z0-9_]*)\s*(?:\[[^\]]*\]\s*)*$", clean)
177 names.append(match.group(1))
184 @brief Extracts the declared C return type prefix for one signature.
185 @param[in] signature Full function signature text.
186 @param[in] symbol Function name contained in the signature.
187 @return Normalized return-type prefix.
190 prefix = signature.split(symbol, 1)[0]
191 return " ".join(prefix.split())
196 @brief Reports whether a Doxygen `@return` tag is required for a C symbol.
197 @param[in] return_type Normalized return-type prefix.
198 @return `True` when the symbol does not return `void`.
201 stripped = return_type.replace(
"extern ",
"").replace(
"static ",
"").replace(
"inline ",
"").strip()
202 return not stripped.startswith(
"void")
207 @brief Collects C signatures from a header or source file.
208 @param[in] path File to scan.
209 @param[in] require_terminator Expected signature terminator, either `;` or `{`.
210 @return List of `(start_line, symbol, signature_text)` tuples.
214 signatures: list[tuple[int, str, str]] = []
216 in_block_comment =
False
218 while line_index < len(lines):
219 stripped = lines[line_index].lstrip()
221 if "*/" in lines[line_index]:
222 in_block_comment =
False
226 if "/*" in lines[line_index]:
227 if "*/" not in lines[line_index]:
228 in_block_comment =
True
232 if stripped.startswith((
"#",
"/*",
"*",
"//"))
or "(" not in lines[line_index]:
236 match = C_DECL_START_RE.match(lines[line_index])
241 symbol = match.group(1)
242 start_line = line_index
243 signature = lines[line_index].rstrip()
244 while line_index + 1 < len(lines)
and require_terminator
not in signature
and ";" not in signature:
246 signature +=
" " + lines[line_index].strip()
248 if require_terminator ==
";" and ";" in signature:
249 signatures.append((start_line, symbol, signature))
250 elif require_terminator ==
"{" and "{" in signature
and ";" not in signature.split(
"{", 1)[0]:
251 signatures.append((start_line, symbol, signature))
260 @brief Audits public C declarations in one header file.
261 @param[in] path Header file to scan.
262 @return Findings emitted for the header.
265 findings: list[AuditFinding] = []
269 if block_range
is None:
273 block =
"\n".join(lines[block_range[0]:block_range[1] + 1])
274 if "@brief" not in block:
278 documented_params = set(C_PARAM_RE.findall(block))
279 if set(declared_params) != documented_params:
285 f
"documented @param names {sorted(documented_params)} do not match declaration {declared_params}",
297 @brief Audits function definitions in one C source file.
298 @param[in] path Source file to scan.
299 @return Findings emitted for the source file.
302 findings: list[AuditFinding] = []
306 if block_range
is None:
310 block =
"\n".join(lines[block_range[0]:block_range[1] + 1])
311 if "@brief" not in block:
319 @brief Returns the meaningful Python parameter names for one function node.
320 @param[in] node Function AST node.
321 @return Ordered list of parameters expected in `@param` tags.
324 names = [arg.arg
for arg
in node.args.posonlyargs + node.args.args + node.args.kwonlyargs]
325 names = [name
for name
in names
if name
not in {
"self",
"cls"}]
326 if node.args.vararg
is not None:
327 names.append(node.args.vararg.arg)
328 if node.args.kwarg
is not None:
329 names.append(node.args.kwarg.arg)
335 @brief Reports whether one Python function should document a return value.
336 @param[in] node Function AST node.
337 @return `True` when the function returns a non-`None` value.
340 for child
in ast.walk(node):
341 if isinstance(child, ast.Return)
and child.value
is not None:
342 if isinstance(child.value, ast.Constant)
and child.value.value
is None:
350 @brief Audits Python function docstrings in one file.
351 @param[in] path Python source file to scan.
352 @return Findings emitted for the Python file.
355 findings: list[AuditFinding] = []
356 source = path.read_text(encoding=
"utf-8")
357 tree = ast.parse(source, filename=str(path))
359 for node
in ast.walk(tree):
360 if not isinstance(node, (ast.FunctionDef, ast.AsyncFunctionDef)):
363 docstring = ast.get_docstring(node)
364 if docstring
is None:
368 if "@brief" not in docstring:
372 documented_params = set(re.findall(
r"@param(?:\[[^\]]+\])?\s+([A-Za-z_][A-Za-z0-9_]*)", docstring))
373 if set(declared_params) != documented_params:
379 f
"documented @param names {sorted(documented_params)} do not match declaration {declared_params}",
391 @brief Runs the full repository documentation audit.
392 @return Sorted list of all findings emitted by the audit.
395 findings: list[AuditFinding] = []
399 if path.suffix ==
".c":
404 return sorted(findings, key=
lambda item: (item.path, item.line, item.symbol, item.message))
409 @brief Prints findings in a grep-friendly format.
410 @param[in] findings Findings to render.
413 for finding
in findings:
414 print(f
"{finding.path}:{finding.line}: {finding.symbol}: {finding.message}")
419 @brief Runs the repository function documentation audit from the command line.
420 @return Process exit status.
426 print(f
"\nFound {len(findings)} documentation issue(s).", file=sys.stderr)
429 print(
"Function documentation audit passed.")
433if __name__ ==
"__main__":
434 raise SystemExit(
main())
Represents one audit failure.
list[str] _python_parameter_names(ast.FunctionDef|ast.AsyncFunctionDef node)
Returns the meaningful Python parameter names for one function node.
list[Path] _iter_c_files(tuple[Path,...] directories)
Returns all C or header files below the configured directories.
list[str] _read_lines(Path path)
Reads a text file into a list of lines.
list[AuditFinding] _audit_python_file(Path path)
Audits Python function docstrings in one file.
str _c_return_type(str signature, str symbol)
Extracts the declared C return type prefix for one signature.
str _relative_path(Path path)
Returns a repository-relative path string.
list[Path] _iter_python_files()
Returns all Python source files covered by the audit.
bool _return_tag_required(str return_type)
Reports whether a Doxygen @return tag is required for a C symbol.
list[str] _split_c_parameters(str signature)
Splits a C signature parameter list into parameter names.
bool _python_requires_return(ast.FunctionDef|ast.AsyncFunctionDef node)
Reports whether one Python function should document a return value.
None _print_findings(list[AuditFinding] findings)
Prints findings in a grep-friendly format.
list[AuditFinding] _audit_c_source(Path path)
Audits function definitions in one C source file.
list[tuple[int, str, str]] _collect_c_signatures(Path path, str require_terminator)
Collects C signatures from a header or source file.
list[AuditFinding] _collect_findings()
Runs the full repository documentation audit.
tuple[int, int]|None _find_attached_doxygen_block(list[str] lines, int start_line)
Finds the Doxygen block immediately attached to a declaration or definition.
list[AuditFinding] _audit_c_header(Path path)
Audits public C declarations in one header file.
int main()
Runs the repository function documentation audit from the command line.