
Commit bb7b988

by256 and xuyxu authored
feat: support arbitrary training criteria (#86)
* feat: support arbitrary training criteria
* feat: support arbitrary training criteria (update docs to include step)
* chore: support arbitrary training criteria (clean up to adhere to black code format)
* finish code

Co-authored-by: xuyxu <xuyx@lamda.nju.edu.cn>
1 parent 13f4b84 commit bb7b988

File tree

14 files changed: +265 -89 lines changed

CHANGELOG.rst

Lines changed: 1 addition & 0 deletions
@@ -18,6 +18,7 @@ Changelog
 Ver 0.1.*
 ---------
 
+* |Feature| |API| Support arbitrary training criteria for all ensembles except Gradient Boosting | `@by256 <https://github.com/by256>`__ and `@xuyxu <https://github.com/xuyxu>`__
 * |Fix| Fix missing functionality of ``save_model`` for :meth:`fit` of Soft Gradient Boosting | `@xuyxu <https://github.com/xuyxu>`__
 * |Feature| |API| Add :class:`SoftGradientBoostingClassifier` and :class:`SoftGradientBoostingRegressor` | `@xuyxu <https://github.com/xuyxu>`__
 * |Feature| |API| Support using dataloader with multiple input | `@xuyxu <https://github.com/xuyxu>`__

docs/index.rst

Lines changed: 3 additions & 0 deletions
@@ -34,6 +34,9 @@ Example
        estimator=base_estimator,           # here is your deep learning model
        n_estimators=10,                    # number of base estimators
    )
+   # Set the criterion
+   criterion = nn.CrossEntropyLoss()       # training objective
+   ensemble.set_criterion(criterion)
 
    # Set the optimizer
    ensemble.set_optimizer(

docs/quick_start.rst

Lines changed: 15 additions & 0 deletions
@@ -82,6 +82,17 @@ The meaning of different arguments is listed as follow:
 * ``n_estimators``: The number of base estimators in the ensemble.
 * ``cuda``: Specify whether to use GPU for training and evaluating the ensemble.
 
+Set the Criterion
+-----------------
+
+The next step is to set the objective function. Since our ensemble model is a classifier, we
+will use cross-entropy:
+
+.. code-block:: python
+
+    criterion = nn.CrossEntropyLoss()
+    model.set_criterion(criterion)
+
 Set the Optimizer
 -----------------
 
@@ -180,6 +191,10 @@ The script below shows an example on using VotingClassifier with 10 MLPs for cla
        cuda=True,
    )
 
+   # Set the criterion
+   criterion = nn.CrossEntropyLoss()
+   model.set_criterion(criterion)
+
    # Set the optimizer
    model.set_optimizer('Adam', lr=1e-3, weight_decay=5e-4)
 
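As a hedged illustration of what "arbitrary training criteria" enables, the sketch below swaps the plain cross-entropy from the quick-start example for a class-weighted one. The MLP definition, the weight values, and the loader name are assumptions made up for this example, not part of the commit:

    import torch
    import torch.nn as nn
    from torchensemble import VotingClassifier

    # Hypothetical base network; any nn.Module can serve as the base estimator.
    class MLP(nn.Module):
        def __init__(self):
            super().__init__()
            self.net = nn.Sequential(
                nn.Linear(784, 128), nn.ReLU(), nn.Linear(128, 10)
            )

        def forward(self, x):
            return self.net(x.view(x.size(0), -1))

    model = VotingClassifier(estimator=MLP, n_estimators=10, cuda=False)

    # Any torch.nn loss module can be passed; the per-class weights here are
    # purely illustrative.
    class_weights = torch.ones(10)
    class_weights[0] = 2.0
    model.set_criterion(nn.CrossEntropyLoss(weight=class_weights))

    model.set_optimizer("Adam", lr=1e-3, weight_decay=5e-4)
    # model.fit(train_loader, epochs=50)  # train_loader: your DataLoader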

torchensemble/_base.py

Lines changed: 9 additions & 6 deletions
@@ -33,6 +33,7 @@ def get_doc(item):
         "predict": const.__predict_doc,
         "set_optimizer": const.__set_optimizer_doc,
         "set_scheduler": const.__set_scheduler_doc,
+        "set_criterion": const.__set_criterion_doc,
         "classifier_forward": const.__classification_forward_doc,
         "classifier_evaluate": const.__classification_evaluate_doc,
         "regressor_forward": const.__regression_forward_doc,
@@ -137,6 +138,10 @@ def _validate_parameters(self, epochs, log_interval):
             self.logger.error(msg.format(log_interval))
             raise ValueError(msg.format(log_interval))
 
+    def set_criterion(self, criterion):
+        """Set the training criterion."""
+        self._criterion = criterion
+
     def set_optimizer(self, optimizer_name, **kwargs):
         """Set the parameter optimizer."""
         self.optimizer_name = optimizer_name
@@ -226,7 +231,6 @@ def evaluate(self, test_loader, return_loss=False):
         self.eval()
         correct = 0
         total = 0
-        criterion = nn.CrossEntropyLoss()
         loss = 0.0
 
         for _, elem in enumerate(test_loader):
@@ -235,7 +239,7 @@ def evaluate(self, test_loader, return_loss=False):
             _, predicted = torch.max(output.data, 1)
             correct += (predicted == target).sum().item()
             total += target.size(0)
-            loss += criterion(output, target)
+            loss += self._criterion(output, target)
 
         acc = 100 * correct / total
         loss /= len(test_loader)
@@ -273,12 +277,11 @@ def _decide_n_outputs(self, train_loader):
     def evaluate(self, test_loader):
         """Docstrings decorated by downstream ensembles."""
         self.eval()
-        mse = 0.0
-        criterion = nn.MSELoss()
+        loss = 0.0
 
         for _, elem in enumerate(test_loader):
             data, target = split_data_target(elem, self.device)
             output = self.forward(*data)
-            mse += criterion(output, target)
+            loss += self._criterion(output, target)
 
-        return float(mse) / len(test_loader)
+        return float(loss) / len(test_loader)
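Because evaluate() (and the per-estimator training loops) now invoke self._criterion(output, target) directly, the stored criterion does not strictly have to be an nn loss module; any callable with the same (output, target) signature should work in principle. A minimal, hypothetical sketch — the label-smoothing function below is illustrative and not part of this commit:

    import torch
    import torch.nn.functional as F

    def label_smoothing_ce(output, target, smoothing=0.1):
        """Illustrative criterion: cross-entropy with label smoothing."""
        n_classes = output.size(1)
        log_probs = F.log_softmax(output, dim=1)
        with torch.no_grad():
            # Smoothed one-hot target distribution.
            true_dist = torch.full_like(log_probs, smoothing / (n_classes - 1))
            true_dist.scatter_(1, target.unsqueeze(1), 1.0 - smoothing)
        return torch.mean(torch.sum(-true_dist * log_probs, dim=1))

    # model.set_criterion(label_smoothing_ce)  # model: any ensemble exposing set_criterion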

torchensemble/_constants.py

Lines changed: 8 additions & 0 deletions
@@ -85,6 +85,14 @@
 """
 
 
+__set_criterion_doc = """
+    Parameters
+    ----------
+    criterion : torch.nn.loss
+        The customized training criterion object.
+"""
+
+
 __fit_doc = """
     Parameters
     ----------
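The documented type "torch.nn.loss" refers to instantiated loss objects from torch.nn. A few common choices that fit this parameter (an illustrative, non-exhaustive list):

    import torch.nn as nn

    # Classification-style criteria (expect logits / log-probabilities and class targets).
    classification_criteria = [nn.CrossEntropyLoss(), nn.NLLLoss()]

    # Regression-style criteria (expect predictions and real-valued targets).
    regression_criteria = [nn.MSELoss(), nn.L1Loss(), nn.SmoothL1Loss()]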

torchensemble/adversarial_training.py

Lines changed: 36 additions & 14 deletions
@@ -246,6 +246,13 @@ def set_optimizer(self, optimizer_name, **kwargs):
     def set_scheduler(self, scheduler_name, **kwargs):
         super().set_scheduler(scheduler_name, **kwargs)
 
+    @torchensemble_model_doc(
+        """Set the training criterion for AdversarialTrainingClassifier.""",
+        "set_criterion",
+    )
+    def set_criterion(self, criterion):
+        super().set_criterion(criterion)
+
     @_adversarial_training_model_doc(
         """Implementation on the training stage of AdversarialTrainingClassifier.""",  # noqa: E501
         "fit",
@@ -282,8 +289,11 @@ def fit(
             optimizers[0], self.scheduler_name, **self.scheduler_args
         )
 
+        # Check the training criterion
+        if not hasattr(self, "_criterion"):
+            self._criterion = nn.CrossEntropyLoss()
+
         # Utils
-        criterion = nn.CrossEntropyLoss()
         best_acc = 0.0
 
         # Internal helper function on pesudo forward
@@ -318,7 +328,7 @@ def _forward(estimators, *x):
                         estimator,
                         cur_lr,
                         optimizer,
-                        criterion,
+                        self._criterion,
                         idx,
                         epoch,
                         log_interval,
@@ -424,6 +434,13 @@ def set_optimizer(self, optimizer_name, **kwargs):
     def set_scheduler(self, scheduler_name, **kwargs):
         super().set_scheduler(scheduler_name, **kwargs)
 
+    @torchensemble_model_doc(
+        """Set the training criterion for AdversarialTrainingRegressor.""",
+        "set_criterion",
+    )
+    def set_criterion(self, criterion):
+        super().set_criterion(criterion)
+
     @_adversarial_training_model_doc(
         """Implementation on the training stage of AdversarialTrainingRegressor.""",  # noqa: E501
         "fit",
@@ -460,9 +477,12 @@ def fit(
             optimizers[0], self.scheduler_name, **self.scheduler_args
         )
 
+        # Check the training criterion
+        if not hasattr(self, "_criterion"):
+            self._criterion = nn.MSELoss()
+
         # Utils
-        criterion = nn.MSELoss()
-        best_mse = float("inf")
+        best_loss = float("inf")
 
         # Internal helper function on pesudo forward
         def _forward(estimators, *x):
@@ -494,7 +514,7 @@ def _forward(estimators, *x):
                         estimator,
                         cur_lr,
                         optimizer,
-                        criterion,
+                        self._criterion,
                         idx,
                         epoch,
                         log_interval,
@@ -515,31 +535,33 @@ def _forward(estimators, *x):
             if test_loader:
                 self.eval()
                 with torch.no_grad():
-                    mse = 0.0
+                    val_loss = 0.0
                     for _, elem in enumerate(test_loader):
                         data, target = io.split_data_target(
                             elem, self.device
                         )
                         output = _forward(estimators, *data)
-                        mse += criterion(output, target)
-                    mse /= len(test_loader)
+                        val_loss += self._criterion(output, target)
+                    val_loss /= len(test_loader)
 
-                    if mse < best_mse:
-                        best_mse = mse
+                    if val_loss < best_loss:
+                        best_loss = val_loss
                         self.estimators_ = nn.ModuleList()
                         self.estimators_.extend(estimators)
                         if save_model:
                             io.save(self, save_dir, self.logger)
 
                     msg = (
-                        "Epoch: {:03d} | Validation MSE:"
+                        "Epoch: {:03d} | Validation Loss:"
                         " {:.5f} | Historical Best: {:.5f}"
                     )
-                    self.logger.info(msg.format(epoch, mse, best_mse))
+                    self.logger.info(
+                        msg.format(epoch, val_loss, best_loss)
+                    )
                     if self.tb_logger:
                         self.tb_logger.add_scalar(
-                            "adversirial_training/Validation_MSE",
-                            mse,
+                            "adversirial_training/Validation_Loss",
+                            val_loss,
                             epoch,
                         )

torchensemble/bagging.py

Lines changed: 35 additions & 13 deletions
@@ -123,6 +123,13 @@ def set_optimizer(self, optimizer_name, **kwargs):
     def set_scheduler(self, scheduler_name, **kwargs):
         super().set_scheduler(scheduler_name, **kwargs)
 
+    @torchensemble_model_doc(
+        """Set the training criterion for BaggingClassifier.""",
+        "set_criterion",
+    )
+    def set_criterion(self, criterion):
+        super().set_criterion(criterion)
+
     @torchensemble_model_doc(
         """Implementation on the training stage of BaggingClassifier.""", "fit"
     )
@@ -157,8 +164,11 @@ def fit(
             optimizers[0], self.scheduler_name, **self.scheduler_args
         )
 
+        # Check the training criterion
+        if not hasattr(self, "_criterion"):
+            self._criterion = nn.CrossEntropyLoss()
+
         # Utils
-        criterion = nn.CrossEntropyLoss()
         best_acc = 0.0
 
         # Internal helper function on pesudo forward
@@ -192,7 +202,7 @@ def _forward(estimators, *x):
                         estimator,
                         cur_lr,
                         optimizer,
-                        criterion,
+                        self._criterion,
                         idx,
                         epoch,
                         log_interval,
@@ -295,6 +305,13 @@ def set_optimizer(self, optimizer_name, **kwargs):
     def set_scheduler(self, scheduler_name, **kwargs):
         super().set_scheduler(scheduler_name, **kwargs)
 
+    @torchensemble_model_doc(
+        """Set the training criterion for BaggingRegressor.""",
+        "set_criterion",
+    )
+    def set_criterion(self, criterion):
+        super().set_criterion(criterion)
+
     @torchensemble_model_doc(
         """Implementation on the training stage of BaggingRegressor.""", "fit"
     )
@@ -329,9 +346,12 @@ def fit(
             optimizers[0], self.scheduler_name, **self.scheduler_args
         )
 
+        # Check the training criterion
+        if not hasattr(self, "_criterion"):
+            self._criterion = nn.MSELoss()
+
         # Utils
-        criterion = nn.MSELoss()
-        best_mse = float("inf")
+        best_loss = float("inf")
 
         # Internal helper function on pesudo forward
         def _forward(estimators, *x):
@@ -362,7 +382,7 @@ def _forward(estimators, *x):
                         estimator,
                         cur_lr,
                         optimizer,
-                        criterion,
+                        self._criterion,
                         idx,
                         epoch,
                         log_interval,
@@ -383,30 +403,32 @@ def _forward(estimators, *x):
             if test_loader:
                 self.eval()
                 with torch.no_grad():
-                    mse = 0.0
+                    val_loss = 0.0
                     for _, elem in enumerate(test_loader):
                         data, target = io.split_data_target(
                             elem, self.device
                         )
                         output = _forward(estimators, *data)
-                        mse += criterion(output, target)
-                    mse /= len(test_loader)
+                        val_loss += self._criterion(output, target)
+                    val_loss /= len(test_loader)
 
-                    if mse < best_mse:
-                        best_mse = mse
+                    if val_loss < best_loss:
+                        best_loss = val_loss
                         self.estimators_ = nn.ModuleList()
                         self.estimators_.extend(estimators)
                         if save_model:
                             io.save(self, save_dir, self.logger)
 
                     msg = (
-                        "Epoch: {:03d} | Validation MSE:"
+                        "Epoch: {:03d} | Validation Loss:"
                        " {:.5f} | Historical Best: {:.5f}"
                     )
-                    self.logger.info(msg.format(epoch, mse, best_mse))
+                    self.logger.info(
+                        msg.format(epoch, val_loss, best_loss)
+                    )
                     if self.tb_logger:
                         self.tb_logger.add_scalar(
-                            "bagging/Validation_MSE", mse, epoch
+                            "bagging/Validation_Loss", val_loss, epoch
                         )
 
             # Update the scheduler
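One consequence visible in the hunks above is that the regressor's validation metric during fit() now reuses whatever criterion was set, logged as "Validation Loss" instead of a hard-coded MSE. A hedged sketch using BaggingRegressor with an L1 loss; the Net module and loader names are assumptions for illustration:

    import torch.nn as nn
    from torchensemble import BaggingRegressor

    # Hypothetical base network for illustration.
    class Net(nn.Module):
        def __init__(self):
            super().__init__()
            self.linear = nn.Linear(8, 1)

        def forward(self, x):
            return self.linear(x)

    model = BaggingRegressor(estimator=Net, n_estimators=5, cuda=False)
    model.set_optimizer("Adam", lr=1e-3)

    # Mean absolute error is now used both for training each estimator and for
    # the "Validation Loss" tracked on test_loader.
    model.set_criterion(nn.L1Loss())
    # model.fit(train_loader, epochs=10, test_loader=val_loader)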
