diff --git a/nemo_curator/modules/__init__.py b/nemo_curator/modules/__init__.py index 2e105a020..631c08c02 100644 --- a/nemo_curator/modules/__init__.py +++ b/nemo_curator/modules/__init__.py @@ -13,7 +13,6 @@ # limitations under the License. from .add_id import AddId -from .distributed_data_classifier import DomainClassifier, QualityClassifier from .exact_dedup import ExactDuplicates from .filter import Filter, Score, ScoreFilter from .fuzzy_dedup import LSH, MinHash @@ -21,6 +20,10 @@ from .modify import Modify from .task import TaskDecontamination +# This import must come after all imports that require cugraph +# See this issue: https://github.com/rapidsai/cugraph/issues/2718 +from .distributed_data_classifier import DomainClassifier, QualityClassifier + __all__ = [ "DomainClassifier", "ExactDuplicates",