Skip to content

Commit d89eba7

Browse files
TST (string dtype): xfail all currently failing tests with future.infer_string
1 parent b3b65a3 commit d89eba7

File tree

13 files changed

+72
-0
lines changed

13 files changed

+72
-0
lines changed

pandas/tests/arrays/floating/test_arithmetic.py

+3
Original file line numberDiff line numberDiff line change
@@ -3,6 +3,8 @@
33
import numpy as np
44
import pytest
55

6+
from pandas._config import using_string_dtype
7+
68
import pandas as pd
79
import pandas._testing as tm
810
from pandas.core.arrays import FloatingArray
@@ -122,6 +124,7 @@ def test_arith_zero_dim_ndarray(other):
122124
# -----------------------------------------------------------------------------
123125

124126

127+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)", strict=False)
125128
def test_error_invalid_values(data, all_arithmetic_operators, using_infer_string):
126129
op = all_arithmetic_operators
127130
s = pd.Series(data)

pandas/tests/arrays/integer/test_arithmetic.py

+3
Original file line numberDiff line numberDiff line change
@@ -3,6 +3,8 @@
33
import numpy as np
44
import pytest
55

6+
from pandas._config import using_string_dtype
7+
68
import pandas as pd
79
import pandas._testing as tm
810
from pandas.core import ops
@@ -172,6 +174,7 @@ def test_numpy_zero_dim_ndarray(other):
172174
# -----------------------------------------------------------------------------
173175

174176

177+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)", strict=False)
175178
def test_error_invalid_values(data, all_arithmetic_operators, using_infer_string):
176179
op = all_arithmetic_operators
177180
s = pd.Series(data)

pandas/tests/extension/test_arrow.py

+3
Original file line numberDiff line numberDiff line change
@@ -32,6 +32,8 @@
3232
import numpy as np
3333
import pytest
3434

35+
from pandas._config import using_string_dtype
36+
3537
from pandas._libs import lib
3638
from pandas._libs.tslibs import timezones
3739
from pandas.compat import (
@@ -1993,6 +1995,7 @@ def test_str_find_large_start():
19931995
tm.assert_series_equal(result, expected)
19941996

19951997

1998+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)", strict=False)
19961999
@pytest.mark.skipif(
19972000
pa_version_under13p0, reason="https://github.com/apache/arrow/issues/36311"
19982001
)

pandas/tests/frame/methods/test_quantile.py

+8
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,8 @@
11
import numpy as np
22
import pytest
33

4+
from pandas._config import using_string_dtype
5+
46
import pandas as pd
57
from pandas import (
68
DataFrame,
@@ -324,6 +326,7 @@ def test_quantile_multi_empty(self, interp_method):
324326
)
325327
tm.assert_frame_equal(result, expected)
326328

329+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)")
327330
def test_quantile_datetime(self, unit):
328331
dti = pd.to_datetime(["2010", "2011"]).as_unit(unit)
329332
df = DataFrame({"a": dti, "b": [0, 5]})
@@ -377,6 +380,7 @@ def test_quantile_datetime(self, unit):
377380
expected = DataFrame(index=[0.5], columns=[])
378381
tm.assert_frame_equal(result, expected)
379382

383+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)")
380384
@pytest.mark.parametrize(
381385
"dtype",
382386
[
@@ -641,6 +645,7 @@ def test_quantile_nat(self, interp_method, unit):
641645
)
642646
tm.assert_frame_equal(res, exp)
643647

648+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)")
644649
def test_quantile_empty_no_rows_floats(self, interp_method):
645650
interpolation, method = interp_method
646651

@@ -869,6 +874,7 @@ def test_quantile_ea_scalar(self, request, obj, index):
869874
else:
870875
tm.assert_series_equal(result, expected)
871876

877+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)", strict=False)
872878
@pytest.mark.parametrize(
873879
"dtype, expected_data, expected_index, axis",
874880
[
@@ -887,6 +893,7 @@ def test_empty_numeric(self, dtype, expected_data, expected_index, axis):
887893
)
888894
tm.assert_series_equal(result, expected)
889895

896+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)", strict=False)
890897
@pytest.mark.parametrize(
891898
"dtype, expected_data, expected_index, axis, expected_dtype",
892899
[
@@ -905,6 +912,7 @@ def test_empty_datelike(
905912
)
906913
tm.assert_series_equal(result, expected)
907914

915+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)", strict=False)
908916
@pytest.mark.parametrize(
909917
"expected_data, expected_index, axis",
910918
[

pandas/tests/frame/test_query_eval.py

+3
Original file line numberDiff line numberDiff line change
@@ -3,6 +3,8 @@
33
import numpy as np
44
import pytest
55

6+
from pandas._config import using_string_dtype
7+
68
from pandas.errors import (
79
NumExprClobberingError,
810
UndefinedVariableError,
@@ -759,6 +761,7 @@ def test_inf(self, op, f, engine, parser):
759761
result = df.query(q, engine=engine, parser=parser)
760762
tm.assert_frame_equal(result, expected)
761763

764+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)")
762765
def test_check_tz_aware_index_query(self, tz_aware_fixture):
763766
# https://github.com/pandas-dev/pandas/issues/29463
764767
tz = tz_aware_fixture

pandas/tests/groupby/methods/test_value_counts.py

+4
Original file line numberDiff line numberDiff line change
@@ -7,6 +7,8 @@
77
import numpy as np
88
import pytest
99

10+
from pandas._config import using_string_dtype
11+
1012
import pandas.util._test_decorators as td
1113

1214
from pandas import (
@@ -273,6 +275,7 @@ def _frame_value_counts(df, keys, normalize, sort, ascending):
273275
return df[keys].value_counts(normalize=normalize, sort=sort, ascending=ascending)
274276

275277

278+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)", strict=False)
276279
@pytest.mark.parametrize("groupby", ["column", "array", "function"])
277280
@pytest.mark.parametrize("normalize, name", [(True, "proportion"), (False, "count")])
278281
@pytest.mark.parametrize(
@@ -356,6 +359,7 @@ def test_against_frame_and_seriesgroupby(
356359
tm.assert_frame_equal(result, expected)
357360

358361

362+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)", strict=False)
359363
@pytest.mark.parametrize(
360364
"dtype",
361365
[

pandas/tests/groupby/test_grouping.py

+4
Original file line numberDiff line numberDiff line change
@@ -10,6 +10,8 @@
1010
import numpy as np
1111
import pytest
1212

13+
from pandas._config import using_string_dtype
14+
1315
from pandas.errors import SpecificationError
1416

1517
import pandas as pd
@@ -805,6 +807,7 @@ def test_groupby_empty(self):
805807
expected = ["name"]
806808
assert result == expected
807809

810+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)")
808811
def test_groupby_level_index_value_all_na(self):
809812
# issue 20519
810813
df = DataFrame(
@@ -978,6 +981,7 @@ def test_groupby_with_empty(self):
978981
grouped = series.groupby(grouper)
979982
assert next(iter(grouped), None) is None
980983

984+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)")
981985
def test_groupby_with_single_column(self):
982986
df = DataFrame({"a": list("abssbab")})
983987
tm.assert_frame_equal(df.groupby("a").get_group("a"), df.iloc[[0, 5]])

pandas/tests/groupby/test_raises.py

+4
Original file line numberDiff line numberDiff line change
@@ -8,6 +8,8 @@
88
import numpy as np
99
import pytest
1010

11+
from pandas._config import using_string_dtype
12+
1113
from pandas import (
1214
Categorical,
1315
DataFrame,
@@ -104,6 +106,7 @@ def _call_and_check(klass, msg, how, gb, groupby_func, args, warn_msg=""):
104106
gb.transform(groupby_func, *args)
105107

106108

109+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)", strict=False)
107110
@pytest.mark.parametrize("how", ["method", "agg", "transform"])
108111
def test_groupby_raises_string(
109112
how, by, groupby_series, groupby_func, df_with_string_col
@@ -205,6 +208,7 @@ def func(x):
205208
getattr(gb, how)(func)
206209

207210

211+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)")
208212
@pytest.mark.parametrize("how", ["agg", "transform"])
209213
@pytest.mark.parametrize("groupby_func_np", [np.sum, np.mean])
210214
def test_groupby_raises_string_np(

pandas/tests/indexes/base_class/test_setops.py

+3
Original file line numberDiff line numberDiff line change
@@ -3,6 +3,8 @@
33
import numpy as np
44
import pytest
55

6+
from pandas._config import using_string_dtype
7+
68
import pandas as pd
79
from pandas import (
810
Index,
@@ -231,6 +233,7 @@ def test_tuple_union_bug(self, method, expected, sort):
231233
expected = Index(expected)
232234
tm.assert_index_equal(result, expected)
233235

236+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)", strict=False)
234237
@pytest.mark.parametrize("first_list", [["b", "a"], []])
235238
@pytest.mark.parametrize("second_list", [["a", "b"], []])
236239
@pytest.mark.parametrize(

pandas/tests/io/json/test_pandas.py

+11
Original file line numberDiff line numberDiff line change
@@ -189,6 +189,7 @@ def test_roundtrip_simple(self, orient, convert_axes, dtype, float_frame):
189189

190190
assert_json_roundtrip_equal(result, expected, orient)
191191

192+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)", strict=False)
192193
@pytest.mark.parametrize("dtype", [False, np.int64])
193194
@pytest.mark.parametrize("convert_axes", [True, False])
194195
def test_roundtrip_intframe(self, orient, convert_axes, dtype, int_frame):
@@ -274,6 +275,7 @@ def test_roundtrip_empty(self, orient, convert_axes):
274275

275276
tm.assert_frame_equal(result, expected)
276277

278+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)", strict=False)
277279
@pytest.mark.parametrize("convert_axes", [True, False])
278280
def test_roundtrip_timestamp(self, orient, convert_axes, datetime_frame):
279281
# TODO: improve coverage with date_format parameter
@@ -701,6 +703,7 @@ def test_series_roundtrip_simple(self, orient, string_series, using_infer_string
701703

702704
tm.assert_series_equal(result, expected)
703705

706+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)")
704707
@pytest.mark.parametrize("dtype", [False, None])
705708
def test_series_roundtrip_object(self, orient, dtype, object_series):
706709
data = StringIO(object_series.to_json(orient=orient))
@@ -810,6 +813,7 @@ def test_path(self, float_frame, int_frame, datetime_frame):
810813
df.to_json(path)
811814
read_json(path)
812815

816+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)")
813817
def test_axis_dates(self, datetime_series, datetime_frame):
814818
# frame
815819
json = StringIO(datetime_frame.to_json())
@@ -822,6 +826,7 @@ def test_axis_dates(self, datetime_series, datetime_frame):
822826
tm.assert_series_equal(result, datetime_series, check_names=False)
823827
assert result.name is None
824828

829+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)")
825830
def test_convert_dates(self, datetime_series, datetime_frame):
826831
# frame
827832
df = datetime_frame
@@ -912,6 +917,7 @@ def test_convert_dates_infer(self, infer_word):
912917
result = read_json(StringIO(ujson_dumps(data)))[["id", infer_word]]
913918
tm.assert_frame_equal(result, expected)
914919

920+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)")
915921
@pytest.mark.parametrize(
916922
"date,date_unit",
917923
[
@@ -972,6 +978,7 @@ def test_date_format_series_raises(self, datetime_series):
972978
with pytest.raises(ValueError, match=msg):
973979
ts.to_json(date_format="iso", date_unit="foo")
974980

981+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)")
975982
def test_date_unit(self, unit, datetime_frame):
976983
df = datetime_frame
977984
df["date"] = Timestamp("20130101 20:43:42").as_unit("ns")
@@ -1112,6 +1119,7 @@ def test_round_trip_exception(self, datapath):
11121119
res = res.fillna(np.nan)
11131120
tm.assert_frame_equal(res, df)
11141121

1122+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)")
11151123
@pytest.mark.network
11161124
@pytest.mark.single_cpu
11171125
@pytest.mark.parametrize(
@@ -1414,6 +1422,7 @@ def test_read_inline_jsonl(self):
14141422
expected = DataFrame([[1, 2], [1, 2]], columns=["a", "b"])
14151423
tm.assert_frame_equal(result, expected)
14161424

1425+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)")
14171426
@pytest.mark.single_cpu
14181427
@td.skip_if_not_us_locale
14191428
def test_read_s3_jsonl(self, s3_public_bucket_with_data, s3so):
@@ -2013,6 +2022,7 @@ def test_json_multiindex(self):
20132022
result = series.to_json(orient="index")
20142023
assert result == expected
20152024

2025+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)")
20162026
@pytest.mark.single_cpu
20172027
def test_to_s3(self, s3_public_bucket, s3so):
20182028
# GH 28375
@@ -2134,6 +2144,7 @@ def test_json_uint64(self):
21342144
result = df.to_json(orient="split")
21352145
assert result == expected
21362146

2147+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)", strict=False)
21372148
def test_read_json_dtype_backend(
21382149
self, string_storage, dtype_backend, orient, using_infer_string
21392150
):

pandas/tests/io/pytables/test_timezones.py

+8
Original file line numberDiff line numberDiff line change
@@ -6,6 +6,8 @@
66
import numpy as np
77
import pytest
88

9+
from pandas._config import using_string_dtype
10+
911
from pandas._libs.tslibs.timezones import maybe_get_tz
1012
import pandas.util._test_decorators as td
1113

@@ -42,6 +44,7 @@ def _compare_with_tz(a, b):
4244
gettz_pytz = lambda x: x
4345

4446

47+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)")
4548
@pytest.mark.parametrize("gettz", [gettz_dateutil, gettz_pytz])
4649
def test_append_with_timezones(setup_path, gettz):
4750
# as columns
@@ -216,6 +219,7 @@ def test_tseries_select_index_column(setup_path):
216219
assert rng.tz == result.dt.tz
217220

218221

222+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)")
219223
def test_timezones_fixed_format_frame_non_empty(setup_path):
220224
with ensure_clean_store(setup_path) as store:
221225
# index
@@ -245,6 +249,7 @@ def test_timezones_fixed_format_frame_non_empty(setup_path):
245249
tm.assert_frame_equal(result, df)
246250

247251

252+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)")
248253
def test_timezones_fixed_format_empty(setup_path, tz_aware_fixture, frame_or_series):
249254
# GH 20594
250255

@@ -260,6 +265,7 @@ def test_timezones_fixed_format_empty(setup_path, tz_aware_fixture, frame_or_ser
260265
tm.assert_equal(result, obj)
261266

262267

268+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)")
263269
def test_timezones_fixed_format_series_nonempty(setup_path, tz_aware_fixture):
264270
# GH 20594
265271

@@ -312,6 +318,7 @@ def test_store_timezone(setup_path):
312318
tm.assert_frame_equal(result, df)
313319

314320

321+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)")
315322
def test_dst_transitions(setup_path):
316323
# make sure we are not failing on transitions
317324
with ensure_clean_store(setup_path) as store:
@@ -332,6 +339,7 @@ def test_dst_transitions(setup_path):
332339
tm.assert_frame_equal(result, df)
333340

334341

342+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)")
335343
def test_read_with_where_tz_aware_index(tmp_path, setup_path):
336344
# GH 11926
337345
periods = 10

pandas/tests/io/test_sql.py

+5
Original file line numberDiff line numberDiff line change
@@ -18,6 +18,8 @@
1818
import numpy as np
1919
import pytest
2020

21+
from pandas._config import using_string_dtype
22+
2123
from pandas._libs import lib
2224
from pandas.compat import pa_version_under14p1
2325
from pandas.compat._optional import import_optional_dependency
@@ -1794,6 +1796,7 @@ def test_api_date_parsing(conn, request):
17941796
]
17951797

17961798

1799+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)")
17971800
@pytest.mark.parametrize("conn", all_connectable_types)
17981801
@pytest.mark.parametrize("error", ["raise", "coerce"])
17991802
@pytest.mark.parametrize(
@@ -3183,6 +3186,7 @@ class DummyException(Exception):
31833186
assert len(res2) == 1
31843187

31853188

3189+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)")
31863190
@pytest.mark.parametrize("conn", sqlalchemy_connectable)
31873191
def test_get_schema_create_table(conn, request, test_frame3):
31883192
# Use a dataframe without a bool column, since MySQL converts bool to
@@ -3574,6 +3578,7 @@ def test_read_sql_dtype_backend(
35743578
tm.assert_frame_equal(result, expected)
35753579

35763580

3581+
@pytest.mark.xfail(using_string_dtype(), reason="TODO(infer_string)")
35773582
@pytest.mark.parametrize("conn", all_connectable)
35783583
@pytest.mark.parametrize("func", ["read_sql", "read_sql_table"])
35793584
def test_read_sql_dtype_backend_table(

0 commit comments

Comments
 (0)