Skip to content

Commit

Permalink
Remove DASK_DATAFRAME__QUERY_PLANNING environment variable (#270)
Browse files (browse the repository at this point in the history)
* Remove the DASK_DATAFRAME__QUERY_PLANNING=False environment variable setting

Signed-off-by: Sarah Yurick <[email protected]>

* isort

Signed-off-by: Sarah Yurick <[email protected]>

---------

Signed-off-by: Sarah Yurick <[email protected]>
  • Loading branch information
sarahyurick authored Oct 9, 2024
1 parent 06c388d commit bf2f8f2
Show file tree
Hide file tree
Showing 7 changed files with 1 addition and 13 deletions.
3 changes: 0 additions & 3 deletions examples/translation_example.py
Original file line number Diff line number Diff line change
@@ -1,7 +1,4 @@
import os

os.environ["DASK_DATAFRAME__QUERY_PLANNING"] = "False"
import argparse
import re
import time
from dataclasses import dataclass
Expand Down
1 change: 0 additions & 1 deletion nemo_curator/classifiers/aegis.py
Original file line number Diff line number Diff line change
Expand Up @@ -14,7 +14,6 @@
import os

os.environ["RAPIDS_NO_INITIALIZE"] = "1"
os.environ["DASK_DATAFRAME__QUERY_PLANNING"] = "False"
from dataclasses import dataclass
from functools import lru_cache
from typing import List, Optional, Union
Expand Down
2 changes: 0 additions & 2 deletions nemo_curator/classifiers/fineweb_edu.py
Original file line number Diff line number Diff line change
Expand Up @@ -14,7 +14,6 @@
import os

os.environ["RAPIDS_NO_INITIALIZE"] = "1"
os.environ["DASK_DATAFRAME__QUERY_PLANNING"] = "False"
import torch
from crossfit import op
from crossfit.backend.torch.hf.model import HFModel
Expand All @@ -23,7 +22,6 @@
from nemo_curator.classifiers.base import (
DistributedDataClassifier,
_get_suggest_memory_for_classifier,
_run_classifier_helper,
)
from nemo_curator.datasets import DocumentDataset

Expand Down
1 change: 0 additions & 1 deletion nemo_curator/scripts/semdedup/clustering.py
Original file line number Diff line number Diff line change
Expand Up @@ -16,7 +16,6 @@
import os
from datetime import datetime

os.environ["DASK_DATAFRAME__QUERY_PLANNING"] = "False"
import dask_cudf

from nemo_curator.datasets import DocumentDataset
Expand Down
2 changes: 0 additions & 2 deletions tests/test_semdedup.py
Original file line number Diff line number Diff line change
Expand Up @@ -14,8 +14,6 @@
import os

import pytest

os.environ["DASK_DATAFRAME__QUERY_PLANNING"] = "False"
from dask.dataframe.utils import assert_eq
from distributed import Client

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -20,16 +20,14 @@
"name": "stdout",
"output_type": "stream",
"text": [
"env: PYTHONWARNINGS=ignore\n",
"env: DASK_DATAFRAME__QUERY_PLANNING=False\n"
"env: PYTHONWARNINGS=ignore\n"
]
}
],
"source": [
"# Silence Warnings (HuggingFace internal warnings)\n",
"\n",
"%env PYTHONWARNINGS=ignore\n",
"%env DASK_DATAFRAME__QUERY_PLANNING=False\n",
"import warnings\n",
"warnings.filterwarnings(\"ignore\")"
]
Expand Down
1 change: 0 additions & 1 deletion tutorials/single_node_tutorial/single_gpu_tutorial.ipynb
Original file line number Diff line number Diff line change
Expand Up @@ -110,7 +110,6 @@
},
"outputs": [],
"source": [
"%env DASK_DATAFRAME__QUERY_PLANNING False\n",
"%env CUDA_VISIBLE_DEVICES 0"
]
},
Expand Down

0 comments on commit bf2f8f2

Please sign in to comment.