update to the latest version

nnnnmj · Aug 5, 2022 · ca66910 · ca66910
1 parent acbe0e3
commit ca66910
Show file tree

Hide file tree

Showing 2 changed files with 4 additions and 3 deletions.
diff --git a/data_generator.py b/data_generator.py
@@ -269,6 +269,7 @@ def generator(self, X=None, y=None, minmax=True,
                                                              realistic_synthetic_mode=realistic_synthetic_mode,
                                                              alpha=alpha, percentage=percentage)
                     np.savez_compressed(os.path.join('datasets', 'synthetic', filepath), X=X, y=y)
+                    pass
 
             else:
                 X, y = self.generate_realistic_synthetic(X, y,

diff --git a/run.py b/run.py
@@ -132,7 +132,7 @@ def __init__(self, suffix:str=None, mode:str='rla', parallel:str=None,
     # dataset filter for delelting those datasets that do not satisfy the experimental requirement
     def dataset_filter(self):
         # dataset list in the current folder
-        dataset_list_org = [os.path.splitext(_)[0] for _ in os.listdir('datasets')]
+        dataset_list_org = [os.path.splitext(_)[0] for _ in os.listdir('datasets') if os.path.splitext(_)[1] in ['.npz', '.csv']]
         dataset_list_org = [_ for _ in dataset_list_org if not _.split('_')[0].isdigit()]
 
         dataset_list = []
@@ -160,7 +160,7 @@ def dataset_filter(self):
 
             # remove high-dimensional CV and NLP datasets if generating synthetic anomalies or robustness test
             if self.realistic_synthetic_mode is not None or self.noise_type is not None:
-                if any([_ in dataset for _ in ['CIFAR10, FashionMNIST', 'SVHN', 'agnews', 'amazon', 'imdb', 'yelp']]):
+                if self.isin_NLPCV(dataset):
                     add = False
 
             if add:
@@ -310,5 +310,5 @@ def run(self):
                 df_time.to_csv(os.path.join(os.getcwd(), 'result', 'Time_' + self.suffix + '.csv'), index=True)
 
 # run the above pipeline for reproducing the results in the paper
-pipeline = RunPipeline(suffix='ADBench', parallel='unsupervise', realistic_synthetic_mode='dependency', noise_type=None)
+pipeline = RunPipeline(suffix='ADBench', parallel='unsupervise', realistic_synthetic_mode='cluster', noise_type=None)
 pipeline.run()