diff --git a/nemo_curator/modules/config.py b/nemo_curator/modules/config.py index 74e61da9..67bf06af 100644 --- a/nemo_curator/modules/config.py +++ b/nemo_curator/modules/config.py @@ -135,7 +135,9 @@ def __post_init__(self): raise ValueError("Buckets per shuffle must be between [1, num_buckets]") if not self.perform_removal: - warnings.warn("In future releases (starting with 0.8.0) the default will be True.") + warnings.warn( + "In future releases (starting with 0.8.0) the default will be True." + ) @dataclass diff --git a/nemo_curator/modules/exact_dedup.py b/nemo_curator/modules/exact_dedup.py index e79efe3b..e537a548 100644 --- a/nemo_curator/modules/exact_dedup.py +++ b/nemo_curator/modules/exact_dedup.py @@ -73,7 +73,9 @@ def __init__( self.text_field = text_field self.perform_removal = perform_removal if not self.perform_removal: - warnings.warn("In future releases (starting with 0.8.0) the default will be True.") + warnings.warn( + "In future releases (starting with 0.8.0) the default will be True." + ) if self.perform_removal and cache_dir is None: warnings.warn("cache_dir is recommended to remove duplicates.") if cache_dir is None and profile_dir is not None: