Skip to content

Commit

Permalink
import from _compat
Browse files (browse the repository at this point in the history)
Signed-off-by: Praateek <[email protected]>
  • Loading branch information
praateekmahajan committed Nov 15, 2024
1 parent c24e97e commit 76d7b4d
Showing 1 changed file with 1 addition and 8 deletions.
9 changes: 1 addition & 8 deletions nemo_curator/modules/fuzzy_dedup.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -33,10 +33,9 @@
from cugraph import MultiGraph
from dask import dataframe as dd
from dask.utils import M
from packaging.version import parse as parse_version
from regex import F
from tqdm import tqdm

from nemo_curator._compat import MINHASH_PERMUTED_AVAILABLE
from nemo_curator.datasets import DocumentDataset
from nemo_curator.log import create_logger
from nemo_curator.modules.config import FuzzyDuplicatesConfig
Expand Down Expand Up @@ -66,12 +65,6 @@
write_partitioned_file,
)

CURRENT_CUDF_VERSION = parse_version(cudf.__version__)
MINHASH_PERMUTED_AVAILABLE = CURRENT_CUDF_VERSION >= parse_version("24.12.0") or (
CURRENT_CUDF_VERSION.is_prerelease
and CURRENT_CUDF_VERSION.base_version >= "24.12.0"
)


class MinHash:
"""
Expand Down

0 comments on commit 76d7b4d

Please sign in to comment.