forked from pandas-dev/pandas
-
Notifications
You must be signed in to change notification settings - Fork 0
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
STYLE use pd_array in core (pandas-dev#40319)
- Loading branch information
1 parent
ae8849c
commit fb04a42
Showing
5 changed files
with
113 additions
and
2 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,26 @@ | ||
import pytest | ||
|
||
from scripts.use_pd_array_in_core import use_pd_array | ||
|
||
# Source snippets fed to the checker.  Both "bad" snippets put the offending
# construct on line 2, column 0, so a single expected message covers them.
BAD_FILE_0 = "import pandas as pd\npd.array"
BAD_FILE_1 = "\nfrom pandas import array"
# "Good" snippets import array under the required pd_array alias.
GOOD_FILE_0 = "from pandas import array as pd_array"
GOOD_FILE_1 = "from pandas.core.construction import array as pd_array"
# File name that the checker reports violations against.
PATH = "t.py"
|
||
|
||
@pytest.mark.parametrize("content", [BAD_FILE_0, BAD_FILE_1])
def test_inconsistent_usage(content, capsys):
    """Flagged content must print the violation to stdout and exit with 1.

    Each parametrized snippet has its offending construct on line 2,
    column 0, which is why one expected message fits both cases.
    """
    expected_msg = (
        "t.py:2:0: Don't use pd.array in core, import array as pd_array instead\n"
    )
    with pytest.raises(SystemExit) as excinfo:
        use_pd_array(content, PATH)
    # The checker signals failure to pre-commit through a non-zero status.
    assert excinfo.value.code == 1
    # readouterr() returns (out, err); the message is written to stdout.
    result_msg, _ = capsys.readouterr()
    assert result_msg == expected_msg
|
||
|
||
@pytest.mark.parametrize("content", [GOOD_FILE_0, GOOD_FILE_1])
def test_consistent_usage(content):
    """Imports aliased as pd_array must pass without raising or exiting."""
    # No assertion needed: any SystemExit or exception fails the test.
    use_pd_array(content, PATH)
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,77 @@ | ||
""" | ||
Check that pandas/core imports pandas.array as pd_array.

This makes it easier to grep for usage of pandas array.

This is meant to be run as a pre-commit hook - to run it manually, you can do:

    pre-commit run use-pd_array-in-core --all-files
""" | ||
|
||
import argparse | ||
import ast | ||
import sys | ||
from typing import ( | ||
Optional, | ||
Sequence, | ||
) | ||
|
||
# Template for a reported violation: "<path>:<line>:<column>: <explanation>".
# The trailing newline is part of the message because it is written with
# sys.stdout.write rather than print.
ERROR_MESSAGE = (
    "{path}:{lineno}:{col_offset}: "
    "Don't use pd.array in core, import array as pd_array instead\n"
)
|
||
|
||
class Visitor(ast.NodeVisitor):
    """AST visitor that rejects un-aliased uses of pandas' ``array``.

    Two constructs are flagged:

    * ``from pandas[...] import array`` without the ``pd_array`` alias;
    * attribute access spelled exactly ``pd.array``.

    On the first violation the formatted ``ERROR_MESSAGE`` is written to
    stdout and the process exits with status 1, so at most one violation is
    reported per run.
    """

    def __init__(self, path: str) -> None:
        """Store ``path`` so violations can be reported against it."""
        self.path = path

    def _report(self, lineno: int, col_offset: int) -> None:
        """Write the violation message for the given position and exit(1)."""
        msg = ERROR_MESSAGE.format(
            path=self.path, lineno=lineno, col_offset=col_offset
        )
        sys.stdout.write(msg)
        sys.exit(1)

    def visit_ImportFrom(self, node: ast.ImportFrom) -> None:
        """Flag ``from pandas... import array`` unless aliased as pd_array."""
        module = node.module
        # ``module`` is None for ``from . import x``; those are not checked.
        # Match the pandas package itself or one of its submodules only, so
        # that unrelated packages whose names merely begin with "pandas"
        # (e.g. ``pandas_gbq``) are not reported.
        from_pandas = module is not None and (
            module == "pandas" or module.startswith("pandas.")
        )
        if from_pandas and any(
            alias.name == "array" and alias.asname != "pd_array"
            for alias in node.names
        ):
            self._report(node.lineno, node.col_offset)
        super().generic_visit(node)

    def visit_Attribute(self, node: ast.Attribute) -> None:
        """Flag attribute access written as ``pd.array``."""
        target = node.value
        if (
            isinstance(target, ast.Name)
            and target.id == "pd"
            and node.attr == "array"
        ):
            self._report(node.lineno, node.col_offset)
        # Keep descending so nested attribute chains are inspected as well.
        super().generic_visit(node)
|
||
|
||
def use_pd_array(content: str, path: str) -> None:
    """Check one file's source for un-aliased uses of pandas' ``array``.

    Parameters
    ----------
    content : str
        Python source code to check; it is parsed with ``ast.parse``.
    path : str
        File name used when reporting a violation.

    Notes
    -----
    Returns normally when nothing is flagged.  When the visitor finds a
    violation it writes a message to stdout and exits the process.
    """
    tree = ast.parse(content)
    visitor = Visitor(path)
    visitor.visit(tree)
|
||
|
||
def main(argv: Optional[Sequence[str]] = None) -> None:
    """Command-line entry point: check every path given as an argument.

    Parameters
    ----------
    argv : sequence of str, optional
        Argument list to parse; ``None`` makes argparse fall back to
        ``sys.argv[1:]``.
    """
    parser = argparse.ArgumentParser()
    parser.add_argument("paths", nargs="*")
    args = parser.parse_args(argv)

    for path in args.paths:
        with open(path, encoding="utf-8") as fd:
            content = fd.read()
        # The file is already closed here; only its text is needed.
        use_pd_array(content, path)
|
||
|
||
# Run the checker only when executed as a script, not when imported.
if __name__ == "__main__":
    main()
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters