-
-
Couldn't load subscription status.
- Fork 19.2k
BUG: groupby.idxmin/idxmax with all NA values should raise #62026
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Changes from 3 commits
7b77ce1
3be5083
4c03fc7
fbfff81
2898f2c
c0038fd
f618d87
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
| Original file line number | Diff line number | Diff line change |
|---|---|---|
|
|
@@ -272,7 +272,7 @@ def test_idxmin_idxmax_extremes_skipna(skipna, how, float_numpy_dtype): | |
| max_value = np.finfo(float_numpy_dtype).max | ||
| df = DataFrame( | ||
| { | ||
| "a": Series(np.repeat(range(1, 6), repeats=2), dtype="intp"), | ||
| "a": Series(np.repeat(range(1, 5), repeats=2), dtype="intp"), | ||
| "b": Series( | ||
| [ | ||
| np.nan, | ||
|
|
@@ -283,8 +283,6 @@ def test_idxmin_idxmax_extremes_skipna(skipna, how, float_numpy_dtype): | |
| np.nan, | ||
| max_value, | ||
| np.nan, | ||
| np.nan, | ||
| np.nan, | ||
|
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. this change is bc there's an all-NA group so itll now raise? There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Yes, and the case of testing for raising is done elsewhere. |
||
| ], | ||
| dtype=float_numpy_dtype, | ||
| ), | ||
|
|
@@ -299,7 +297,7 @@ def test_idxmin_idxmax_extremes_skipna(skipna, how, float_numpy_dtype): | |
| return | ||
| result = getattr(gb, how)(skipna=skipna) | ||
| expected = DataFrame( | ||
| {"b": [1, 3, 4, 6, np.nan]}, index=pd.Index(range(1, 6), name="a", dtype="intp") | ||
| {"b": [1, 3, 4, 6]}, index=pd.Index(range(1, 5), name="a", dtype="intp") | ||
| ) | ||
| tm.assert_frame_equal(result, expected) | ||
|
|
||
|
|
@@ -1003,8 +1001,6 @@ def test_string_dtype_all_na( | |
| else: | ||
| expected_dtype = "int64" | ||
| expected_value = 1 if reduction_func == "size" else 0 | ||
| elif reduction_func in ["idxmin", "idxmax"]: | ||
| expected_dtype, expected_value = "float64", np.nan | ||
| elif not skipna or min_count > 0: | ||
| expected_value = pd.NA | ||
| elif reduction_func == "sum": | ||
|
|
@@ -1032,8 +1028,11 @@ def test_string_dtype_all_na( | |
| with pytest.raises(TypeError, match=msg): | ||
| method(*args, **kwargs) | ||
| return | ||
| elif reduction_func in ["idxmin", "idxmax"] and not skipna: | ||
| msg = f"{reduction_func} with skipna=False encountered an NA value." | ||
| elif reduction_func in ["idxmin", "idxmax"]: | ||
| if skipna: | ||
| msg = f"{reduction_func} with skipna=True encountered all NA values" | ||
| else: | ||
| msg = f"{reduction_func} with skipna=False encountered an NA value." | ||
| with pytest.raises(ValueError, match=msg): | ||
| method(*args, **kwargs) | ||
| return | ||
|
|
||
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
does 10694 cover both of these cases?
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
No - added the linked issue in the OP. Thanks!