circuitpython/tools/extract_pyi.py

277 lines
8.8 KiB
Python
Raw Normal View History

2020-06-03 23:40:05 +01:00
# SPDX-FileCopyrightText: 2014 MicroPython & CircuitPython contributors (https://github.com/adafruit/circuitpython/graphs/contributors)
#
# SPDX-License-Identifier: MIT
# Run with 'python tools/extract_pyi.py shared-bindings/ path/to/stub/dir
# You can also test a specific library in shared-bindings by putting the path
# to that directory instead
2020-07-22 00:37:22 +09:00
import ast
2020-04-27 14:36:14 -07:00
import os
2020-07-22 00:37:22 +09:00
import re
2020-04-27 14:36:14 -07:00
import sys
import traceback
2020-07-22 00:37:22 +09:00
import isort
2020-07-24 03:22:41 +09:00
import black
2020-07-22 00:37:22 +09:00
2021-03-15 19:27:36 +05:30
IMPORTS_IGNORE = frozenset(
{
"int",
"float",
"bool",
"str",
"bytes",
"tuple",
"list",
"set",
"dict",
"bytearray",
"slice",
"file",
"buffer",
"range",
"array",
"struct_time",
}
)
IMPORTS_TYPING = frozenset(
{
"Any",
2021-07-20 17:24:04 -05:00
"Dict",
2021-03-15 19:27:36 +05:30
"Optional",
"Union",
"Tuple",
"List",
"Sequence",
"NamedTuple",
"Iterable",
"Iterator",
"Callable",
"AnyStr",
"overload",
"Type",
}
)
IMPORTS_TYPES = frozenset({"TracebackType"})
CPY_TYPING = frozenset(
{"ReadableBuffer", "WriteableBuffer", "AudioSample", "FrameBuffer", "Alarm"}
)
2020-07-22 00:37:22 +09:00
2020-08-03 13:35:43 +09:00
def is_typed(node, allow_any=False):
2020-07-22 00:37:22 +09:00
if node is None:
2020-08-03 13:35:43 +09:00
return False
if allow_any:
2020-07-22 00:37:22 +09:00
return True
2020-08-03 13:35:43 +09:00
elif isinstance(node, ast.Name) and node.id == "Any":
return False
2021-03-15 19:27:36 +05:30
elif (
isinstance(node, ast.Attribute)
and type(node.value) == ast.Name
and node.value.id == "typing"
and node.attr == "Any"
):
2020-08-03 13:35:43 +09:00
return False
return True
2020-07-22 00:37:22 +09:00
2020-08-03 13:35:43 +09:00
def find_stub_issues(tree):
2020-07-22 00:37:22 +09:00
for node in ast.walk(tree):
2020-08-03 13:35:43 +09:00
if isinstance(node, ast.AnnAssign):
if not is_typed(node.annotation):
yield ("WARN", f"Missing attribute type on line {node.lineno}")
if isinstance(node.value, ast.Constant) and node.value.value == Ellipsis:
yield ("WARN", f"Unnecessary Ellipsis assignment (= ...) on line {node.lineno}.")
elif isinstance(node, ast.Assign):
if isinstance(node.value, ast.Constant) and node.value.value == Ellipsis:
yield ("WARN", f"Unnecessary Ellipsis assignment (= ...) on line {node.lineno}.")
elif isinstance(node, ast.arguments):
2020-08-08 01:33:24 +09:00
allargs = list(node.args + node.kwonlyargs)
if sys.version_info >= (3, 8):
allargs.extend(node.posonlyargs)
for arg_node in allargs:
2021-03-15 19:27:36 +05:30
if not is_typed(arg_node.annotation) and (
arg_node.arg != "self" and arg_node.arg != "cls"
):
yield (
"WARN",
f"Missing argument type: {arg_node.arg} on line {arg_node.lineno}",
)
2020-08-03 13:35:43 +09:00
if node.vararg and not is_typed(node.vararg.annotation, allow_any=True):
2021-03-15 19:27:36 +05:30
yield (
"WARN",
f"Missing argument type: *{node.vararg.arg} on line {node.vararg.lineno}",
)
2020-08-03 13:35:43 +09:00
if node.kwarg and not is_typed(node.kwarg.annotation, allow_any=True):
2021-03-15 19:27:36 +05:30
yield (
"WARN",
f"Missing argument type: **{node.kwarg.arg} on line {node.kwarg.lineno}",
)
2020-08-03 13:35:43 +09:00
elif isinstance(node, ast.FunctionDef):
if not is_typed(node.returns):
yield ("WARN", f"Missing return type: {node.name} on line {node.lineno}")
2020-07-22 00:37:22 +09:00
def extract_imports(tree):
modules = set()
typing = set()
types = set()
2020-08-03 13:35:43 +09:00
cpy_typing = set()
2020-07-22 00:37:22 +09:00
def collect_annotations(anno_tree):
if anno_tree is None:
return
for node in ast.walk(anno_tree):
2020-08-03 13:35:43 +09:00
if isinstance(node, ast.Name):
2020-07-22 00:37:22 +09:00
if node.id in IMPORTS_IGNORE:
continue
elif node.id in IMPORTS_TYPING:
typing.add(node.id)
elif node.id in IMPORTS_TYPES:
types.add(node.id)
2020-08-03 13:35:43 +09:00
elif node.id in CPY_TYPING:
cpy_typing.add(node.id)
elif isinstance(node, ast.Attribute):
if isinstance(node.value, ast.Name):
2020-07-24 03:22:41 +09:00
modules.add(node.value.id)
2020-07-22 00:37:22 +09:00
for node in ast.walk(tree):
2020-08-03 13:35:43 +09:00
if isinstance(node, (ast.AnnAssign, ast.arg)):
2020-07-22 00:37:22 +09:00
collect_annotations(node.annotation)
2020-08-03 13:35:43 +09:00
elif isinstance(node, ast.Assign):
collect_annotations(node.value)
elif isinstance(node, ast.FunctionDef):
2020-07-22 00:37:22 +09:00
collect_annotations(node.returns)
2020-07-24 03:22:41 +09:00
for deco in node.decorator_list:
2020-08-03 13:35:43 +09:00
if isinstance(deco, ast.Name) and (deco.id in IMPORTS_TYPING):
2020-07-24 03:22:41 +09:00
typing.add(deco.id)
2020-07-22 00:37:22 +09:00
return {
"modules": sorted(modules),
"typing": sorted(typing),
"types": sorted(types),
2020-08-03 13:35:43 +09:00
"cpy_typing": sorted(cpy_typing),
2020-07-22 00:37:22 +09:00
}
2020-04-27 14:36:14 -07:00
2020-08-03 13:35:43 +09:00
def find_references(tree):
for node in ast.walk(tree):
if isinstance(node, ast.arguments):
for node in ast.walk(node):
if isinstance(node, ast.Attribute):
if isinstance(node.value, ast.Name) and node.value.id[0].isupper():
yield node.value.id
2020-05-14 15:57:35 -07:00
def convert_folder(top_level, stub_directory):
ok = 0
total = 0
filenames = sorted(os.listdir(top_level))
2020-08-03 13:35:43 +09:00
stub_fragments = []
references = set()
2020-07-22 00:37:22 +09:00
2020-05-14 15:57:35 -07:00
for filename in filenames:
full_path = os.path.join(top_level, filename)
file_lines = []
if os.path.isdir(full_path):
2020-07-22 00:37:22 +09:00
(mok, mtotal) = convert_folder(full_path, os.path.join(stub_directory, filename))
2020-05-14 15:57:35 -07:00
ok += mok
total += mtotal
elif filename.endswith(".c"):
2020-08-03 13:35:43 +09:00
with open(full_path, "r", encoding="utf-8") as f:
2020-05-14 15:57:35 -07:00
for line in f:
2020-08-03 13:35:43 +09:00
line = line.rstrip()
2020-05-14 15:57:35 -07:00
if line.startswith("//|"):
2020-08-03 13:35:43 +09:00
if len(line) == 3:
line = ""
elif line[3] == " ":
2020-05-14 15:57:35 -07:00
line = line[4:]
else:
2020-08-03 13:35:43 +09:00
line = line[3:]
print("[WARN] There must be at least one space after '//|'")
2020-05-14 15:57:35 -07:00
file_lines.append(line)
elif filename.endswith(".pyi"):
with open(full_path, "r") as f:
2020-08-03 13:35:43 +09:00
file_lines.extend(line.rstrip() for line in f)
fragment = "\n".join(file_lines).strip()
try:
tree = ast.parse(fragment)
except SyntaxError as e:
print(f"[ERROR] Failed to parse a Python stub from {full_path}")
traceback.print_exception(type(e), e, e.__traceback__)
return (ok, total + 1)
references.update(find_references(tree))
if fragment:
name = os.path.splitext(os.path.basename(filename))[0]
if name == "__init__" or (name in references):
stub_fragments.insert(0, fragment)
else:
stub_fragments.append(fragment)
if not stub_fragments:
2020-07-22 00:37:22 +09:00
return (ok, total)
2020-05-14 15:57:35 -07:00
stub_filename = os.path.join(stub_directory, "__init__.pyi")
2020-04-27 14:36:14 -07:00
print(stub_filename)
2020-08-03 13:35:43 +09:00
stub_contents = "\n\n".join(stub_fragments)
2020-04-27 14:36:14 -07:00
2020-08-03 13:35:43 +09:00
# Validate the stub code.
2020-04-27 14:36:14 -07:00
try:
2020-07-22 00:37:22 +09:00
tree = ast.parse(stub_contents)
except SyntaxError as e:
2020-04-27 14:36:14 -07:00
traceback.print_exception(type(e), e, e.__traceback__)
2020-07-22 00:37:22 +09:00
return (ok, total)
2020-08-03 13:35:43 +09:00
error = False
for (level, msg) in find_stub_issues(tree):
if level == "ERROR":
error = True
print(f"[{level}] {msg}")
total += 1
if not error:
ok += 1
2020-07-22 00:37:22 +09:00
# Add import statements
2020-08-03 13:35:43 +09:00
imports = extract_imports(tree)
2020-07-22 00:37:22 +09:00
import_lines = ["from __future__ import annotations"]
if imports["types"]:
import_lines.append("from types import " + ", ".join(imports["types"]))
2020-07-24 03:22:41 +09:00
if imports["typing"]:
import_lines.append("from typing import " + ", ".join(imports["typing"]))
2020-08-03 13:35:43 +09:00
if imports["cpy_typing"]:
import_lines.append("from circuitpython_typing import " + ", ".join(imports["cpy_typing"]))
2020-07-22 00:37:22 +09:00
import_lines.extend(f"import {m}" for m in imports["modules"])
import_body = "\n".join(import_lines)
m = re.match(r'(\s*""".*?""")', stub_contents, flags=re.DOTALL)
if m:
2021-03-15 19:27:36 +05:30
stub_contents = m.group(1) + "\n\n" + import_body + "\n\n" + stub_contents[m.end() :]
2020-07-22 00:37:22 +09:00
else:
stub_contents = import_body + "\n\n" + stub_contents
2020-07-24 03:22:41 +09:00
# Code formatting
stub_contents = isort.code(stub_contents)
stub_contents = black.format_str(stub_contents, mode=black.FileMode(is_pyi=True))
2020-07-22 00:37:22 +09:00
os.makedirs(stub_directory, exist_ok=True)
with open(stub_filename, "w") as f:
f.write(stub_contents)
return (ok, total)
if __name__ == "__main__":
top_level = sys.argv[1].strip("/")
stub_directory = sys.argv[2]
2020-05-14 15:57:35 -07:00
2020-07-22 00:37:22 +09:00
(ok, total) = convert_folder(top_level, stub_directory)
2020-04-27 14:36:14 -07:00
2020-07-22 00:37:22 +09:00
print(f"Parsing .pyi files: {total - ok} failed, {ok} passed")
2020-07-22 00:37:22 +09:00
if ok != total:
sys.exit(total - ok)