From cb7b6c61cd14fe7b2e6bc0774f805b6b6f94d235 Mon Sep 17 00:00:00 2001 From: Michael Xie Date: Tue, 19 Dec 2023 21:26:09 -0800 Subject: [PATCH] domain_to_idxs typo --- experimental/data_selection/dsir_pipeline.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/experimental/data_selection/dsir_pipeline.py b/experimental/data_selection/dsir_pipeline.py index 737cb59..c3e7d1d 100644 --- a/experimental/data_selection/dsir_pipeline.py +++ b/experimental/data_selection/dsir_pipeline.py @@ -218,10 +218,10 @@ def compute_domain_idxs(filter_domains): if domain in todo_domains: domain_to_idxs[domain].append(i) for domain, idxs in domain_to_idxs.items(): - np.save(ds_path / f"{domain.replace(' ', '_')}_idxs.npy", np.asarray(idxs)) - domain_idxs_path = ds_path / f"{domain.replace(' ', '_')}_idxs.npy" + for domain in filter_domains: + domain_idxs_path = ds_path / f"{domain.replace(' ', '_')}_idxs.npy" domain_idxs = np.load(domain_idxs_path) domain_to_idxs[domain] = domain_idxs