Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Implementing mypyc support pt. 2 #2431

Merged
merged 28 commits into from
Nov 16, 2021
Merged
Show file tree
Hide file tree
Changes from 18 commits
Commits
Show all changes
28 commits
Select commit Hold shift + click to select a range
9531e1b
Initial mypyc support changes
ichard26 Jun 6, 2021
6e9e0fb
Make the test suite usable for testing
ichard26 Jun 6, 2021
acb77f7
Fix mypyc KeyError on src/black/parsing.py
ichard26 Jun 12, 2021
a37fb77
Saves ~100 kB on my Linux machine :)
ichard26 Jun 30, 2021
2ccc774
Strings specific micro-optimization (1-10% perf boost)
ichard26 Jun 30, 2021
6f60e6e
Looks like I'll be marking more and more tests
ichard26 Jul 1, 2021
f508be4
Fix mypyc + Black on Windows
ichard26 Jul 10, 2021
94dcddb
Ask mypy to warn on unreachable code
ichard26 Jul 10, 2021
57a25ed
Clean up mypyc setup in setup.py
ichard26 Jul 10, 2021
8f42f28
Merge branch 'main' into mypyc-support-pt2
ichard26 Jul 17, 2021
f6a3e78
Initial mypyc optimizations - 5% faster parsing
ichard26 Jul 27, 2021
911d0d8
More parsing optimizations - 4% faster
ichard26 Jul 27, 2021
1f0df05
Just some cleanup
ichard26 Jul 31, 2021
58fbe9c
--version now indicates whether black is compiled
ichard26 Aug 1, 2021
c7de2ea
Round 3 of optimizations - 95% black + 5% blib2to3
ichard26 Aug 3, 2021
b956802
Merge branch 'main' into mypyc-support-pt2
ichard26 Aug 8, 2021
eaa4f6c
Fix crashes and errors since merge from main
ichard26 Aug 7, 2021
e9834e0
Mild hack so mypyc doesn't break diff-shades + cleanup
ichard26 Aug 11, 2021
f103dc0
Address feedback & cleanup comments
ichard26 Aug 21, 2021
5fc39fe
Merge branch 'main' into mypyc-support-pt2
ichard26 Oct 28, 2021
2f238ca
Skip a few more monkeypatching tests
ichard26 Oct 28, 2021
f561b0c
Bring back ignore for unused type ignore
ichard26 Oct 28, 2021
11b4f09
Merge branch 'main' into mypyc-support-pt2
ichard26 Oct 30, 2021
b0b3709
Merge branch 'main' into mypyc-support-pt2
ichard26 Oct 31, 2021
bb86dcf
Merge branch 'main' into mypyc-support-pt2
ichard26 Nov 14, 2021
5ef46f4
Optimizations + compatiblity fixes
ichard26 Nov 14, 2021
7c52cdb
Merge branch 'main' into mypyc-support-pt2
ichard26 Nov 14, 2021
f5f1099
Fix crash on PyPy by deoptimizing :(
ichard26 Nov 16, 2021
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
21 changes: 20 additions & 1 deletion mypy.ini
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,6 @@
# free to run mypy on Windows, Linux, or macOS and get consistent
# results.
python_version=3.6
platform=linux

show_column_numbers=True

Expand All @@ -23,6 +22,10 @@ warn_unused_ignores=True
# Until we're not supporting 3.6 primer needs this
disallow_any_generics=False

# Unreachable blocks have been an issue when compiling mypyc, let's try
# to avoid 'em in the first place.
warn_unreachable=True

# The following are off by default. Flip them on if you feel
# adventurous.
disallow_untyped_defs=True
Expand All @@ -33,7 +36,23 @@ cache_dir=/dev/null

[mypy-aiohttp.*]
follow_imports=skip

[mypy-black]
# The following is because of `patch_click()`. Remove when
# we drop Python 3.6 support.
warn_unused_ignores=False

[mypy-black.files]
# Unfortunately tomli has deprecated strings and changed the API type
# annotations to bytes all while strings still work. We still use strings
# since it's unclear whether this will last (depends on how much the
# TOML people like bare CR as a newline sequence I suppose). Anyway,
# some versions of tomli still specify str as the type so mypy complains
# that the type: ignore is unnecessary. Gosh I wish I wasn't telling
# this story.
#
# See also: https://github.com/psf/black/pull/2408
# https://github.com/pypa/pip/pull/10238 (because black is
# following whatever they do)
# https://github.com/toml-lang/toml/issues/837
warn_unused_ignores=False
ichard26 marked this conversation as resolved.
Show resolved Hide resolved
3 changes: 3 additions & 0 deletions pyproject.toml
Original file line number Diff line number Diff line change
Expand Up @@ -33,3 +33,6 @@ optional-tests = [
"no_blackd: run when `d` extra NOT installed",
"no_jupyter: run when `jupyter` extra NOT installed",
]
markers = [
"incompatible_with_mypyc: run when testing mypyc compiled black"
]
47 changes: 36 additions & 11 deletions setup.py
Original file line number Diff line number Diff line change
Expand Up @@ -5,6 +5,7 @@

assert sys.version_info >= (3, 6, 2), "black requires Python 3.6.2+"
from pathlib import Path # noqa E402
from typing import List # noqa: E402

CURRENT_DIR = Path(__file__).parent
sys.path.insert(0, str(CURRENT_DIR)) # for setuptools.build_meta
Expand All @@ -18,6 +19,17 @@ def get_long_description() -> str:
)


def find_python_files(base: Path) -> List[Path]:
files = []
for entry in base.iterdir():
if entry.is_file() and entry.suffix == ".py":
files.append(entry)
elif entry.is_dir():
files.extend(find_python_files(entry))

return files


USE_MYPYC = False
# To compile with mypyc, a mypyc checkout must be present on the PYTHONPATH
if len(sys.argv) > 1 and sys.argv[1] == "--use-mypyc":
Expand All @@ -27,21 +39,34 @@ def get_long_description() -> str:
USE_MYPYC = True

if USE_MYPYC:
from mypyc.build import mypycify

src = CURRENT_DIR / "src"
# TIP: filepaths are normalized to use forward slashes and are relative to ./src/
# before being checked against.
blocklist = [
# Not performance sensitive, so save bytes + compilation time:
"blib2to3/__init__.py",
"blib2to3/pgen2/__init__.py",
"black/output.py",
"black/concurrency.py",
"black/files.py",
"black/report.py",
# Breaks the test suite when compiled (and is also useless):
"black/debug.py",
# Compiled modules can't be run directly and that's a problem here:
"black/__main__.py",
]
discovered = []
# black-primer and blackd have no good reason to be compiled.
discovered.extend(find_python_files(src / "black"))
discovered.extend(find_python_files(src / "blib2to3"))
mypyc_targets = [
"src/black/__init__.py",
"src/blib2to3/pytree.py",
"src/blib2to3/pygram.py",
"src/blib2to3/pgen2/parse.py",
"src/blib2to3/pgen2/grammar.py",
"src/blib2to3/pgen2/token.py",
"src/blib2to3/pgen2/driver.py",
"src/blib2to3/pgen2/pgen.py",
str(p) for p in discovered if p.relative_to(src).as_posix() not in blocklist
]

from mypyc.build import mypycify

opt_level = os.getenv("MYPYC_OPT_LEVEL", "3")
ext_modules = mypycify(mypyc_targets, opt_level=opt_level)
ext_modules = mypycify(mypyc_targets, opt_level=opt_level, verbose=True)
else:
ext_modules = []

Expand Down
19 changes: 15 additions & 4 deletions src/black/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -29,8 +29,9 @@
Union,
)

from dataclasses import replace
import click
from dataclasses import replace
from mypy_extensions import mypyc_attr

from black.const import DEFAULT_LINE_LENGTH, DEFAULT_INCLUDES, DEFAULT_EXCLUDES
from black.const import STDIN_PLACEHOLDER
Expand Down Expand Up @@ -65,6 +66,8 @@

from _black_version import version as __version__

COMPILED = Path(__file__).suffix in (".pyd", ".so")

# types
FileContent = str
Encoding = str
Expand Down Expand Up @@ -174,7 +177,10 @@ def validate_regex(
raise click.BadParameter("Not a valid regular expression")


@click.command(context_settings=dict(help_option_names=["-h", "--help"]))
@click.command(
context_settings=dict(help_option_names=["-h", "--help"]),
help="The uncompromising code formatter.",
)
@click.option("-c", "--code", type=str, help="Format the code passed in as a string.")
@click.option(
"-l",
Expand Down Expand Up @@ -335,7 +341,10 @@ def validate_regex(
" due to exclusion patterns."
),
)
@click.version_option(version=__version__)
@click.version_option(
version=__version__,
message=f"%(prog)s, %(version)s (compiled: {'yes' if COMPILED else 'no'})",
)
@click.argument(
"src",
nargs=-1,
Expand Down Expand Up @@ -376,7 +385,7 @@ def main(
experimental_string_processing: bool,
quiet: bool,
verbose: bool,
required_version: str,
required_version: Optional[str],
include: Pattern,
exclude: Optional[Pattern],
extend_exclude: Optional[Pattern],
Expand Down Expand Up @@ -639,6 +648,7 @@ def reformat_one(
report.failed(src, str(exc))


@mypyc_attr(patchable=True)
def reformat_many(
sources: Set[Path], fast: bool, write_back: WriteBack, mode: Mode, report: "Report"
) -> None:
Expand All @@ -648,6 +658,7 @@ def reformat_many(
worker_count = os.cpu_count()
if sys.platform == "win32":
# Work around https://bugs.python.org/issue26903
assert worker_count is not None
worker_count = min(worker_count, 60)
try:
executor = ProcessPoolExecutor(max_workers=worker_count)
Expand Down
4 changes: 3 additions & 1 deletion src/black/brackets.py
Original file line number Diff line number Diff line change
Expand Up @@ -49,7 +49,9 @@
DOT_PRIORITY: Final = 1


class BracketMatchError(KeyError):
# Ideally this would be a subclass of KeyError, but mypyc doesn't like that.
ichard26 marked this conversation as resolved.
Show resolved Hide resolved
# See also: https://mypyc.readthedocs.io/en/latest/native_classes.html#inheritance.
class BracketMatchError(Exception):
"""Raised when an opening bracket is unable to be matched to a closing bracket."""


Expand Down
15 changes: 10 additions & 5 deletions src/black/comments.py
Original file line number Diff line number Diff line change
@@ -1,8 +1,14 @@
import sys
from dataclasses import dataclass
from functools import lru_cache
import regex as re
from typing import Iterator, List, Optional, Union

if sys.version_info >= (3, 8):
from typing import Final
else:
from typing_extensions import Final

from blib2to3.pytree import Node, Leaf
from blib2to3.pgen2 import token

Expand All @@ -12,11 +18,10 @@
# types
LN = Union[Leaf, Node]


FMT_OFF = {"# fmt: off", "# fmt:off", "# yapf: disable"}
FMT_SKIP = {"# fmt: skip", "# fmt:skip"}
FMT_PASS = {*FMT_OFF, *FMT_SKIP}
FMT_ON = {"# fmt: on", "# fmt:on", "# yapf: enable"}
FMT_OFF: Final = {"# fmt: off", "# fmt:off", "# yapf: disable"}
FMT_SKIP: Final = {"# fmt: skip", "# fmt:skip"}
FMT_PASS: Final = {*FMT_OFF, *FMT_SKIP}
FMT_ON: Final = {"# fmt: on", "# fmt:on", "# yapf: enable"}


@dataclass
Expand Down
2 changes: 2 additions & 0 deletions src/black/files.py
Original file line number Diff line number Diff line change
Expand Up @@ -17,6 +17,7 @@
TYPE_CHECKING,
)

from mypy_extensions import mypyc_attr
from pathspec import PathSpec
import tomli

Expand Down Expand Up @@ -87,6 +88,7 @@ def find_pyproject_toml(path_search_start: Tuple[str, ...]) -> Optional[str]:
return None


@mypyc_attr(patchable=True)
def parse_pyproject_toml(path_config: str) -> Dict[str, Any]:
"""Parse a pyproject toml file, pulling out relevant parts for Black

Expand Down
13 changes: 7 additions & 6 deletions src/black/handle_ipynb_magics.py
Original file line number Diff line number Diff line change
Expand Up @@ -312,7 +312,7 @@ class CellMagic:
body: str


@dataclasses.dataclass
# ast.NodeVisitor + dataclass = breakage under mypyc.
class CellMagicFinder(ast.NodeVisitor):
"""Find cell magics.

Expand All @@ -331,7 +331,8 @@ class CellMagicFinder(ast.NodeVisitor):
and we look for instances of the latter.
"""

cell_magic: Optional[CellMagic] = None
def __init__(self, cell_magic: Optional[CellMagic] = None) -> None:
self.cell_magic = cell_magic

def visit_Expr(self, node: ast.Expr) -> None:
"""Find cell magic, extract header and body."""
Expand All @@ -357,7 +358,8 @@ class OffsetAndMagic:
magic: str


@dataclasses.dataclass
# Unsurprisingly, dataclasses are Not. An. Option. Here. Due. To. Mypyc. As. Usual.
# > fyi it's due the ast.NodeVisitor parent type
class MagicFinder(ast.NodeVisitor):
"""Visit cell to look for get_ipython calls.

Expand All @@ -377,9 +379,8 @@ class MagicFinder(ast.NodeVisitor):
types of magics).
"""

magics: Dict[int, List[OffsetAndMagic]] = dataclasses.field(
default_factory=lambda: collections.defaultdict(list)
)
def __init__(self) -> None:
self.magics: Dict[int, List[OffsetAndMagic]] = collections.defaultdict(list)

def visit_Assign(self, node: ast.Assign) -> None:
"""Look for system assign magics.
Expand Down
24 changes: 16 additions & 8 deletions src/black/linegen.py
Original file line number Diff line number Diff line change
Expand Up @@ -5,8 +5,6 @@
import sys
from typing import Collection, Iterator, List, Optional, Set, Union

from dataclasses import dataclass, field

from black.nodes import WHITESPACE, STATEMENT, STANDALONE_COMMENT
from black.nodes import ASSIGNMENTS, OPENING_BRACKETS, CLOSING_BRACKETS
from black.nodes import Visitor, syms, first_child_is_arith, ensure_visible
Expand Down Expand Up @@ -40,17 +38,20 @@ class CannotSplit(CannotTransform):
"""A readable split that fits the allotted line length is impossible."""


@dataclass
# This isn't a dataclass because @dataclass + Generic breaks mypyc.
# See also https://github.com/mypyc/mypyc/issues/827.
class LineGenerator(Visitor[Line]):
"""Generates reformatted Line objects. Empty lines are not emitted.

Note: destroys the tree it's visiting by mutating prefixes of its leaves
in ways that will no longer stringify to valid Python code on the tree.
"""

mode: Mode
remove_u_prefix: bool = False
current_line: Line = field(init=False)
def __init__(self, mode: Mode, remove_u_prefix: bool = False) -> None:
self.mode = mode
self.remove_u_prefix = remove_u_prefix
self.current_line: Line
self.__post_init__()

def line(self, indent: int = 0) -> Iterator[Line]:
"""Generate a line.
Expand Down Expand Up @@ -335,7 +336,9 @@ def transform_line(
transformers = [left_hand_split]
else:

def rhs(line: Line, features: Collection[Feature]) -> Iterator[Line]:
def _rhs(
self: object, line: Line, features: Collection[Feature]
) -> Iterator[Line]:
"""Wraps calls to `right_hand_split`.

The calls increasingly `omit` right-hand trailers (bracket pairs with
Expand All @@ -362,6 +365,11 @@ def rhs(line: Line, features: Collection[Feature]) -> Iterator[Line]:
line, line_length=mode.line_length, features=features
)

# HACK: functions (like rhs) compiled by mypyc don't retain their __name__
ichard26 marked this conversation as resolved.
Show resolved Hide resolved
# attribute which is needed in `run_transformer` further down. Unfortunately
# a nested class breaks mypyc too. So a class must be created via type ...
rhs = type("rhs", (), {"__call__": _rhs})()

if mode.experimental_string_processing:
if line.inside_brackets:
transformers = [
Expand Down Expand Up @@ -962,7 +970,7 @@ def run_transformer(
result.extend(transform_line(transformed_line, mode=mode, features=features))

if (
transform.__name__ != "rhs"
transform.__class__.__name__ != "rhs"
or not line.bracket_tracker.invisible
or any(bracket.value for bracket in line.bracket_tracker.invisible)
or line.contains_multiline_strings()
Expand Down
3 changes: 2 additions & 1 deletion src/black/mode.py
Original file line number Diff line number Diff line change
Expand Up @@ -6,6 +6,7 @@

from dataclasses import dataclass, field
from enum import Enum
from operator import attrgetter
from typing import Dict, Set

from black.const import DEFAULT_LINE_LENGTH
Expand Down Expand Up @@ -109,7 +110,7 @@ def get_cache_key(self) -> str:
if self.target_versions:
version_str = ",".join(
str(version.value)
for version in sorted(self.target_versions, key=lambda v: v.value)
for version in sorted(self.target_versions, key=attrgetter("value"))
)
else:
version_str = "-"
Expand Down
Loading