Skip to content

Commit 6d99292

Browse files
ayushdg authored and nicoleeeluo committed
Fix failing GPU tests with latest pandas bump (NVIDIA#41)
Signed-off-by: Ayush Dattagupta <[email protected]>
Signed-off-by: Nicole Luo <[email protected]>
1 parent 417e874 commit 6d99292

File tree

1 file changed

+4
-2
lines changed

1 file changed

+4
-2
lines changed

tests/test_fuzzy_dedup.py

+4 -2
Original file line number | Diff line number | Diff line change
@@ -114,7 +114,7 @@ def test_minhash_approximation(
114114
tuple(zip(minhash_signatures, strings))
115115
):
116116
true_jaccard = jaccard_index(str1, str2, char_ngrams)
117-
minhash_approximation = minhash_overlap(sig1, sig2)
117+
minhash_approximation = minhash_overlap(np.array(sig1), np.array(sig2))
118118
assert abs(true_jaccard - minhash_approximation) < THRESHOLD
119119

120120
def test_minhash_cache(self, fuzzy_dedup_data, tmpdir):
@@ -172,7 +172,9 @@ def test_multiple_id_cols(self, tmpdir):
172172
)
173173
buckets = lsh(self.dataset)
174174
buckets_df = buckets.df.compute().to_pandas()
175-
buckets_df["new_id"] = list(zip(buckets_df.dataset_id, buckets_df.id))
175+
buckets_df["new_id"] = list(
176+
map(list, zip(buckets_df.dataset_id, buckets_df.id))
177+
)
176178
docs_list = buckets_df.groupby("_bucket_id").new_id.apply(list)
177179
expected_df = cudf.Series(
178180
[[(1, 1), (1, 2)], [(1, 2), (2, 3)], [(3, 4), (4, 5)]], name="new_id"

0 commit comments

Comments
 (0)