diff --git a/dev/sparktestsupport/modules.py b/dev/sparktestsupport/modules.py index 202263febc93..ad164b1a8636 100644 --- a/dev/sparktestsupport/modules.py +++ b/dev/sparktestsupport/modules.py @@ -1059,6 +1059,21 @@ def __hash__(self): ], python_test_goals=[ # pandas-on-Spark unittests + "pyspark.pandas.tests.connect.test_parity_categorical", + "pyspark.pandas.tests.connect.test_parity_config", + "pyspark.pandas.tests.connect.test_parity_extension", + "pyspark.pandas.tests.connect.test_parity_frame_spark", + "pyspark.pandas.tests.connect.test_parity_generic_functions", + "pyspark.pandas.tests.connect.test_parity_indexops_spark", + "pyspark.pandas.tests.connect.test_parity_internal", + "pyspark.pandas.tests.connect.test_parity_namespace", + "pyspark.pandas.tests.connect.test_parity_numpy_compat", + "pyspark.pandas.tests.connect.test_parity_repr", + "pyspark.pandas.tests.connect.test_parity_scalars", + "pyspark.pandas.tests.connect.test_parity_spark_functions", + "pyspark.pandas.tests.connect.test_parity_sql", + "pyspark.pandas.tests.connect.test_parity_typedef", + "pyspark.pandas.tests.connect.test_parity_utils", "pyspark.pandas.tests.connect.data_type_ops.test_parity_as_type", "pyspark.pandas.tests.connect.data_type_ops.test_parity_base", "pyspark.pandas.tests.connect.data_type_ops.test_parity_binary_ops", @@ -1073,37 +1088,15 @@ def __hash__(self): "pyspark.pandas.tests.connect.data_type_ops.test_parity_string_ops", "pyspark.pandas.tests.connect.data_type_ops.test_parity_udt_ops", "pyspark.pandas.tests.connect.data_type_ops.test_parity_timedelta_ops", - "pyspark.pandas.tests.connect.indexes.test_parity_category", - "pyspark.pandas.tests.connect.indexes.test_parity_timedelta", "pyspark.pandas.tests.connect.plot.test_parity_frame_plot", "pyspark.pandas.tests.connect.plot.test_parity_frame_plot_matplotlib", "pyspark.pandas.tests.connect.plot.test_parity_frame_plot_plotly", "pyspark.pandas.tests.connect.plot.test_parity_series_plot", "pyspark.pandas.tests.connect.plot.test_parity_series_plot_matplotlib", "pyspark.pandas.tests.connect.plot.test_parity_series_plot_plotly", - "pyspark.pandas.tests.connect.test_parity_categorical", - "pyspark.pandas.tests.connect.test_parity_config", "pyspark.pandas.tests.connect.indexes.test_parity_default", - "pyspark.pandas.tests.connect.test_parity_extension", - "pyspark.pandas.tests.connect.test_parity_frame_spark", - "pyspark.pandas.tests.connect.test_parity_generic_functions", - "pyspark.pandas.tests.connect.test_parity_indexops_spark", - "pyspark.pandas.tests.connect.test_parity_internal", - "pyspark.pandas.tests.connect.test_parity_namespace", - "pyspark.pandas.tests.connect.test_parity_numpy_compat", - "pyspark.pandas.tests.connect.test_parity_repr", - "pyspark.pandas.tests.connect.resample.test_parity_error", - "pyspark.pandas.tests.connect.resample.test_parity_missing", - "pyspark.pandas.tests.connect.resample.test_parity_on", - "pyspark.pandas.tests.connect.resample.test_parity_timezone", - "pyspark.pandas.tests.connect.test_parity_scalars", - "pyspark.pandas.tests.connect.series.test_parity_datetime", - "pyspark.pandas.tests.connect.series.test_parity_string_ops_adv", - "pyspark.pandas.tests.connect.series.test_parity_string_ops_basic", - "pyspark.pandas.tests.connect.test_parity_spark_functions", - "pyspark.pandas.tests.connect.test_parity_sql", - "pyspark.pandas.tests.connect.test_parity_typedef", - "pyspark.pandas.tests.connect.test_parity_utils", + "pyspark.pandas.tests.connect.indexes.test_parity_category", + "pyspark.pandas.tests.connect.indexes.test_parity_timedelta", "pyspark.pandas.tests.connect.indexes.test_parity_basic", "pyspark.pandas.tests.connect.indexes.test_parity_getattr", "pyspark.pandas.tests.connect.indexes.test_parity_name", @@ -1146,11 +1139,6 @@ def __hash__(self): "pyspark.pandas.tests.connect.computation.test_parity_describe", "pyspark.pandas.tests.connect.computation.test_parity_eval", "pyspark.pandas.tests.connect.computation.test_parity_melt", - "pyspark.pandas.tests.connect.frame.test_parity_attrs", - "pyspark.pandas.tests.connect.frame.test_parity_axis", - "pyspark.pandas.tests.connect.diff_frames_ops.test_parity_dot_frame", - "pyspark.pandas.tests.connect.diff_frames_ops.test_parity_dot_series", - "pyspark.pandas.tests.connect.diff_frames_ops.test_parity_error", ], excluded_python_implementations=[ "PyPy" # Skip these tests under PyPy since they require numpy, pandas, and pyarrow and @@ -1166,6 +1154,8 @@ def __hash__(self): ], python_test_goals=[ # pandas-on-Spark unittests + "pyspark.pandas.tests.connect.frame.test_parity_attrs", + "pyspark.pandas.tests.connect.frame.test_parity_axis", "pyspark.pandas.tests.connect.frame.test_parity_constructor", "pyspark.pandas.tests.connect.frame.test_parity_conversion", "pyspark.pandas.tests.connect.frame.test_parity_reindexing", @@ -1183,14 +1173,9 @@ def __hash__(self): "pyspark.pandas.tests.connect.groupby.test_parity_split_apply_adv", "pyspark.pandas.tests.connect.groupby.test_parity_split_apply_basic", "pyspark.pandas.tests.connect.groupby.test_parity_split_apply_min_max", - "pyspark.pandas.tests.connect.diff_frames_ops.test_parity_align", - "pyspark.pandas.tests.connect.diff_frames_ops.test_parity_basic_slow", - "pyspark.pandas.tests.connect.diff_frames_ops.test_parity_cov", - "pyspark.pandas.tests.connect.diff_frames_ops.test_parity_corrwith", - "pyspark.pandas.tests.connect.diff_frames_ops.test_parity_index", - "pyspark.pandas.tests.connect.diff_frames_ops.test_parity_series", - "pyspark.pandas.tests.connect.diff_frames_ops.test_parity_setitem_frame", - "pyspark.pandas.tests.connect.diff_frames_ops.test_parity_setitem_series", + "pyspark.pandas.tests.connect.series.test_parity_datetime", + "pyspark.pandas.tests.connect.series.test_parity_string_ops_adv", + "pyspark.pandas.tests.connect.series.test_parity_string_ops_basic", "pyspark.pandas.tests.connect.series.test_parity_all_any", "pyspark.pandas.tests.connect.series.test_parity_arg_ops", "pyspark.pandas.tests.connect.series.test_parity_as_of", @@ -1203,6 +1188,7 @@ def __hash__(self): "pyspark.pandas.tests.connect.series.test_parity_series", "pyspark.pandas.tests.connect.series.test_parity_sort", "pyspark.pandas.tests.connect.series.test_parity_stat", + "pyspark.pandas.tests.connect.series.test_parity_interpolate", "pyspark.pandas.tests.connect.data_type_ops.test_parity_num_arithmetic", "pyspark.pandas.tests.connect.data_type_ops.test_parity_num_mod", "pyspark.pandas.tests.connect.data_type_ops.test_parity_num_mul_div", @@ -1235,15 +1221,15 @@ def __hash__(self): "pyspark.pandas.tests.connect.computation.test_parity_pivot_table_multi_idx", "pyspark.pandas.tests.connect.computation.test_parity_pivot_table_multi_idx_adv", "pyspark.pandas.tests.connect.computation.test_parity_stats", - "pyspark.pandas.tests.connect.indexes.test_parity_append", - "pyspark.pandas.tests.connect.indexes.test_parity_intersection", - "pyspark.pandas.tests.connect.indexes.test_parity_monotonic", - "pyspark.pandas.tests.connect.indexes.test_parity_union", + "pyspark.pandas.tests.connect.computation.test_parity_missing_data", "pyspark.pandas.tests.connect.frame.test_parity_interpolate", "pyspark.pandas.tests.connect.frame.test_parity_interpolate_error", - "pyspark.pandas.tests.connect.series.test_parity_interpolate", "pyspark.pandas.tests.connect.resample.test_parity_frame", "pyspark.pandas.tests.connect.resample.test_parity_series", + "pyspark.pandas.tests.connect.resample.test_parity_error", + "pyspark.pandas.tests.connect.resample.test_parity_missing", + "pyspark.pandas.tests.connect.resample.test_parity_on", + "pyspark.pandas.tests.connect.resample.test_parity_timezone", "pyspark.pandas.tests.connect.window.test_parity_ewm_error", "pyspark.pandas.tests.connect.window.test_parity_ewm_mean", "pyspark.pandas.tests.connect.window.test_parity_groupby_ewm_mean", @@ -1263,7 +1249,17 @@ def __hash__(self): "pyspark.pandas.tests.connect.diff_frames_ops.test_parity_groupby_rolling", "pyspark.pandas.tests.connect.diff_frames_ops.test_parity_groupby_rolling_adv", "pyspark.pandas.tests.connect.diff_frames_ops.test_parity_groupby_rolling_count", - "pyspark.pandas.tests.connect.computation.test_parity_missing_data", + "pyspark.pandas.tests.connect.diff_frames_ops.test_parity_dot_frame", + "pyspark.pandas.tests.connect.diff_frames_ops.test_parity_dot_series", + "pyspark.pandas.tests.connect.diff_frames_ops.test_parity_error", + "pyspark.pandas.tests.connect.diff_frames_ops.test_parity_align", + "pyspark.pandas.tests.connect.diff_frames_ops.test_parity_basic_slow", + "pyspark.pandas.tests.connect.diff_frames_ops.test_parity_cov", + "pyspark.pandas.tests.connect.diff_frames_ops.test_parity_corrwith", + "pyspark.pandas.tests.connect.diff_frames_ops.test_parity_index", + "pyspark.pandas.tests.connect.diff_frames_ops.test_parity_series", + "pyspark.pandas.tests.connect.diff_frames_ops.test_parity_setitem_frame", + "pyspark.pandas.tests.connect.diff_frames_ops.test_parity_setitem_series", "pyspark.pandas.tests.connect.groupby.test_parity_index", "pyspark.pandas.tests.connect.groupby.test_parity_describe", "pyspark.pandas.tests.connect.groupby.test_parity_head_tail", @@ -1301,6 +1297,10 @@ def __hash__(self): "pyspark.pandas.tests.connect.groupby.test_parity_stat_ddof", "pyspark.pandas.tests.connect.groupby.test_parity_stat_func", "pyspark.pandas.tests.connect.groupby.test_parity_stat_prod", + "pyspark.pandas.tests.connect.indexes.test_parity_append", + "pyspark.pandas.tests.connect.indexes.test_parity_intersection", + "pyspark.pandas.tests.connect.indexes.test_parity_monotonic", + "pyspark.pandas.tests.connect.indexes.test_parity_union", "pyspark.pandas.tests.connect.indexes.test_parity_datetime", "pyspark.pandas.tests.connect.indexes.test_parity_datetime_at", "pyspark.pandas.tests.connect.indexes.test_parity_datetime_between",