From e98d131bce371463556cb6761d8d5a9e37f92cce Mon Sep 17 00:00:00 2001
From: ngreenwald <noahfgreenwald@gmail.com>
Date: Fri, 4 Sep 2020 10:00:07 -0700
Subject: [PATCH] Rename build_dataset argument balance_dataset to balance

---
 caliban_toolbox/dataset_builder.py      | 6 +++---
 caliban_toolbox/dataset_builder_test.py | 2 +-
 2 files changed, 4 insertions(+), 4 deletions(-)

diff --git a/caliban_toolbox/dataset_builder.py b/caliban_toolbox/dataset_builder.py
index 8871413..88a901e 100644
--- a/caliban_toolbox/dataset_builder.py
+++ b/caliban_toolbox/dataset_builder.py
@@ -564,7 +564,7 @@ def _validate_output_shape(self, output_shape):
                              'or length 3, got {}'.format(output_shape))
 
     def build_dataset(self, tissues='all', platforms='all', output_shape=(512, 512), resize=False,
-                      data_split=(0.8, 0.1, 0.1), seed=0, balance_dataset=False, **kwargs):
+                      data_split=(0.8, 0.1, 0.1), seed=0, balance=False, **kwargs):
         """Construct a dataset for model training and evaluation
 
         Args:
@@ -582,7 +582,7 @@ def build_dataset(self, tissues='all', platforms='all', output_shape=(512, 512),
                     - by_image. Resizes by median cell size within each image
             data_split: tuple specifying the fraction of the dataset for train/val/test
             seed: seed for reproducible splitting of dataset
-            balance_dataset: if true, randomly duplicate less-represented tissue types
+            balance: if true, randomly duplicate less-represented tissue types
                 in train and val splits so that there are the same number of images of each type
             **kwargs: other arguments to be passed to helper functions
 
@@ -642,7 +642,7 @@ def build_dataset(self, tissues='all', platforms='all', output_shape=(512, 512),
                                               min_objects=min_objects)
 
             # don't balance test split
-            if balance_dataset and idx != 2:
+            if balance and idx != 2:
                 current_dict = self._balance_dict(current_dict, seed=seed, category='tissue_list')
 
             dicts[idx] = current_dict
diff --git a/caliban_toolbox/dataset_builder_test.py b/caliban_toolbox/dataset_builder_test.py
index 8dd387f..5914adf 100644
--- a/caliban_toolbox/dataset_builder_test.py
+++ b/caliban_toolbox/dataset_builder_test.py
@@ -708,7 +708,7 @@ def test_build_dataset(tmp_path):
     # full runthrough with default options changed
     _ = db.build_dataset(tissues='all', platforms=platforms, output_shape=(10, 10),
                          relabel=True, resize='by_image', small_object_threshold=5,
-                         balance_dataset=True)
+                         balance=True)
 
 
 def test_summarize_dataset(tmp_path):