333 lines
8.1 KiB
Python
333 lines
8.1 KiB
Python
from __future__ import annotations
|
|
|
|
import subprocess
|
|
import sys
|
|
|
|
import pytest
|
|
|
|
import pandas as pd
|
|
from pandas import api
|
|
import pandas._testing as tm
|
|
|
|
|
|
class Base:
|
|
def check(self, namespace, expected, ignored=None):
|
|
# see which names are in the namespace, minus optional
|
|
# ignored ones
|
|
# compare vs the expected
|
|
|
|
result = sorted(
|
|
f for f in dir(namespace) if not f.startswith("__") and f != "annotations"
|
|
)
|
|
if ignored is not None:
|
|
result = sorted(set(result) - set(ignored))
|
|
|
|
expected = sorted(expected)
|
|
tm.assert_almost_equal(result, expected)
|
|
|
|
|
|
class TestPDApi(Base):
|
|
# these are optionally imported based on testing
|
|
# & need to be ignored
|
|
ignored = ["tests", "locale", "conftest"]
|
|
|
|
# top-level sub-packages
|
|
public_lib = [
|
|
"api",
|
|
"arrays",
|
|
"options",
|
|
"test",
|
|
"testing",
|
|
"errors",
|
|
"plotting",
|
|
"io",
|
|
"tseries",
|
|
]
|
|
private_lib = ["compat", "core", "pandas", "util"]
|
|
|
|
# these are already deprecated; awaiting removal
|
|
deprecated_modules: list[str] = ["np", "datetime"]
|
|
|
|
# misc
|
|
misc = ["IndexSlice", "NaT", "NA"]
|
|
|
|
# top-level classes
|
|
classes = [
|
|
"ArrowDtype",
|
|
"Categorical",
|
|
"CategoricalIndex",
|
|
"DataFrame",
|
|
"DateOffset",
|
|
"DatetimeIndex",
|
|
"ExcelFile",
|
|
"ExcelWriter",
|
|
"Float64Index",
|
|
"Flags",
|
|
"Grouper",
|
|
"HDFStore",
|
|
"Index",
|
|
"Int64Index",
|
|
"MultiIndex",
|
|
"Period",
|
|
"PeriodIndex",
|
|
"RangeIndex",
|
|
"UInt64Index",
|
|
"Series",
|
|
"SparseDtype",
|
|
"StringDtype",
|
|
"Timedelta",
|
|
"TimedeltaIndex",
|
|
"Timestamp",
|
|
"Interval",
|
|
"IntervalIndex",
|
|
"CategoricalDtype",
|
|
"PeriodDtype",
|
|
"IntervalDtype",
|
|
"DatetimeTZDtype",
|
|
"BooleanDtype",
|
|
"Int8Dtype",
|
|
"Int16Dtype",
|
|
"Int32Dtype",
|
|
"Int64Dtype",
|
|
"UInt8Dtype",
|
|
"UInt16Dtype",
|
|
"UInt32Dtype",
|
|
"UInt64Dtype",
|
|
"Float32Dtype",
|
|
"Float64Dtype",
|
|
"NamedAgg",
|
|
]
|
|
|
|
# these are already deprecated; awaiting removal
|
|
deprecated_classes: list[str] = ["Float64Index", "Int64Index", "UInt64Index"]
|
|
|
|
# these should be deprecated in the future
|
|
deprecated_classes_in_future: list[str] = ["SparseArray"]
|
|
|
|
# external modules exposed in pandas namespace
|
|
modules: list[str] = []
|
|
|
|
# top-level functions
|
|
funcs = [
|
|
"array",
|
|
"bdate_range",
|
|
"concat",
|
|
"crosstab",
|
|
"cut",
|
|
"date_range",
|
|
"interval_range",
|
|
"eval",
|
|
"factorize",
|
|
"get_dummies",
|
|
"from_dummies",
|
|
"infer_freq",
|
|
"isna",
|
|
"isnull",
|
|
"lreshape",
|
|
"melt",
|
|
"notna",
|
|
"notnull",
|
|
"offsets",
|
|
"merge",
|
|
"merge_ordered",
|
|
"merge_asof",
|
|
"period_range",
|
|
"pivot",
|
|
"pivot_table",
|
|
"qcut",
|
|
"show_versions",
|
|
"timedelta_range",
|
|
"unique",
|
|
"value_counts",
|
|
"wide_to_long",
|
|
]
|
|
|
|
# top-level option funcs
|
|
funcs_option = [
|
|
"reset_option",
|
|
"describe_option",
|
|
"get_option",
|
|
"option_context",
|
|
"set_option",
|
|
"set_eng_float_format",
|
|
]
|
|
|
|
# top-level read_* funcs
|
|
funcs_read = [
|
|
"read_clipboard",
|
|
"read_csv",
|
|
"read_excel",
|
|
"read_fwf",
|
|
"read_gbq",
|
|
"read_hdf",
|
|
"read_html",
|
|
"read_xml",
|
|
"read_json",
|
|
"read_pickle",
|
|
"read_sas",
|
|
"read_sql",
|
|
"read_sql_query",
|
|
"read_sql_table",
|
|
"read_stata",
|
|
"read_table",
|
|
"read_feather",
|
|
"read_parquet",
|
|
"read_orc",
|
|
"read_spss",
|
|
]
|
|
|
|
# top-level json funcs
|
|
funcs_json = ["json_normalize"]
|
|
|
|
# top-level to_* funcs
|
|
funcs_to = ["to_datetime", "to_numeric", "to_pickle", "to_timedelta"]
|
|
|
|
# top-level to deprecate in the future
|
|
deprecated_funcs_in_future: list[str] = []
|
|
|
|
# these are already deprecated; awaiting removal
|
|
deprecated_funcs: list[str] = []
|
|
|
|
# private modules in pandas namespace
|
|
private_modules = [
|
|
"_config",
|
|
"_libs",
|
|
"_is_numpy_dev",
|
|
"_testing",
|
|
"_typing",
|
|
"_version",
|
|
]
|
|
|
|
def test_api(self):
|
|
|
|
checkthese = (
|
|
self.public_lib
|
|
+ self.private_lib
|
|
+ self.misc
|
|
+ self.modules
|
|
+ self.classes
|
|
+ self.funcs
|
|
+ self.funcs_option
|
|
+ self.funcs_read
|
|
+ self.funcs_json
|
|
+ self.funcs_to
|
|
+ self.private_modules
|
|
)
|
|
self.check(namespace=pd, expected=checkthese, ignored=self.ignored)
|
|
|
|
def test_api_all(self):
|
|
expected = set(
|
|
self.public_lib
|
|
+ self.misc
|
|
+ self.modules
|
|
+ self.classes
|
|
+ self.funcs
|
|
+ self.funcs_option
|
|
+ self.funcs_read
|
|
+ self.funcs_json
|
|
+ self.funcs_to
|
|
) - set(self.deprecated_classes)
|
|
actual = set(pd.__all__)
|
|
|
|
extraneous = actual - expected
|
|
assert not extraneous
|
|
|
|
missing = expected - actual
|
|
assert not missing
|
|
|
|
def test_depr(self):
|
|
deprecated_list = (
|
|
self.deprecated_modules
|
|
+ self.deprecated_classes
|
|
+ self.deprecated_classes_in_future
|
|
+ self.deprecated_funcs
|
|
+ self.deprecated_funcs_in_future
|
|
)
|
|
for depr in deprecated_list:
|
|
with tm.assert_produces_warning(FutureWarning):
|
|
_ = getattr(pd, depr)
|
|
|
|
|
|
def test_datetime():
|
|
from datetime import datetime
|
|
import warnings
|
|
|
|
with warnings.catch_warnings():
|
|
warnings.simplefilter("ignore", FutureWarning)
|
|
assert datetime(2015, 1, 2, 0, 0) == datetime(2015, 1, 2, 0, 0)
|
|
|
|
assert isinstance(datetime(2015, 1, 2, 0, 0), datetime)
|
|
|
|
|
|
def test_sparsearray():
|
|
import warnings
|
|
|
|
with warnings.catch_warnings():
|
|
warnings.simplefilter("ignore", FutureWarning)
|
|
assert isinstance(pd.array([1, 2, 3], dtype="Sparse"), pd.SparseArray)
|
|
|
|
|
|
def test_np():
|
|
import warnings
|
|
|
|
import numpy as np
|
|
|
|
with warnings.catch_warnings():
|
|
warnings.simplefilter("ignore", FutureWarning)
|
|
assert (pd.np.arange(0, 10) == np.arange(0, 10)).all()
|
|
|
|
|
|
class TestApi(Base):
|
|
allowed = ["types", "extensions", "indexers", "interchange"]
|
|
|
|
def test_api(self):
|
|
self.check(api, self.allowed)
|
|
|
|
|
|
class TestTesting(Base):
|
|
funcs = [
|
|
"assert_frame_equal",
|
|
"assert_series_equal",
|
|
"assert_index_equal",
|
|
"assert_extension_array_equal",
|
|
]
|
|
|
|
def test_testing(self):
|
|
from pandas import testing # noqa: PDF015
|
|
|
|
self.check(testing, self.funcs)
|
|
|
|
def test_util_testing_deprecated(self):
|
|
# avoid cache state affecting the test
|
|
sys.modules.pop("pandas.util.testing", None)
|
|
|
|
with tm.assert_produces_warning(FutureWarning) as m:
|
|
import pandas.util.testing # noqa: F401
|
|
|
|
assert "pandas.util.testing is deprecated" in str(m[0].message)
|
|
assert "pandas.testing instead" in str(m[0].message)
|
|
|
|
def test_util_testing_deprecated_direct(self):
|
|
# avoid cache state affecting the test
|
|
sys.modules.pop("pandas.util.testing", None)
|
|
with tm.assert_produces_warning(FutureWarning) as m:
|
|
from pandas.util.testing import assert_series_equal # noqa: F401
|
|
|
|
assert "pandas.util.testing is deprecated" in str(m[0].message)
|
|
assert "pandas.testing instead" in str(m[0].message)
|
|
|
|
def test_util_in_top_level(self):
|
|
# in a subprocess to avoid import caching issues
|
|
out = subprocess.check_output(
|
|
[
|
|
sys.executable,
|
|
"-c",
|
|
"import pandas; pandas.util.testing.assert_series_equal",
|
|
],
|
|
stderr=subprocess.STDOUT,
|
|
).decode()
|
|
assert "pandas.util.testing is deprecated" in out
|
|
|
|
with pytest.raises(AttributeError, match="foo"):
|
|
pd.util.foo
|