
Commit cc79216

zzzzwj and xuyxu authored
[ENH] Fix the parallelization issue on logging
* Create the pytest script for the logging module
* Fix warnings raised by flake8
* Formalize the name of my function
* Replace python.logging with the multiprocessing-logging module
* Eliminate warnings produced by flake8
* Fix one small bug
* Remove the debug script
* Replace the multiprocessing logger with print
* Remove the test_logging script, which does not work on Windows
* Write log before parallelization
* Restore the example on classification

Co-authored-by: zzzzwj <zwj@nju.edu.cn>
Co-authored-by: Yi-Xuan Xu <xuyx@lamda.nju.edu.cn>
1 parent 671ee28 commit cc79216
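
The root cause, per the squashed history above, is that `logging` handlers configured in the parent process are generally not available inside joblib's worker processes (torchensemble dispatches workers via `parallel(delayed(...))`), so per-batch records emitted by `_parallel_fit_per_epoch` were lost or had to be shipped back via `msg_list`. The pattern the commit settles on — log once in the parent *before* dispatch, plain `print` inside workers — can be sketched standalone; the `worker` function and logger name here are illustrative, not torchensemble code:

```python
import logging
from joblib import Parallel, delayed  # the backend behind torchensemble's n_jobs

logging.basicConfig(level=logging.INFO)
logger = logging.getLogger("demo")  # hypothetical logger name


def worker(idx):
    # Handlers configured in the parent are typically not inherited by
    # joblib's spawned worker processes, so logger calls here can vanish;
    # print() writes to the worker's stdout instead.
    print("Estimator: {:03d} running".format(idx))
    return idx


if __name__ == "__main__":
    n_jobs = 2
    if n_jobs and n_jobs > 1:
        # Log in the parent, before parallelization, where handlers work.
        logger.info("Parallelization on %d jobs", n_jobs)
    rets = Parallel(n_jobs=n_jobs)(delayed(worker)(i) for i in range(4))
    logger.info("Collected results: %s", rets)
```

Worker `print` output still reaches the console through the inherited stdout, at the cost of not appearing in any file handler attached to the logger; that is the tradeoff this commit accepts.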

3 files changed: 42 additions & 28 deletions

torchensemble/adversarial_training.py

Lines changed: 10 additions & 0 deletions
```diff
@@ -270,6 +270,11 @@ def _forward(estimators, data):
             # Training loop
             for epoch in range(epochs):
                 self.train()
+
+                if self.n_jobs and self.n_jobs > 1:
+                    msg = "Parallelization on the training epoch: {:03d}"
+                    self.logger.info(msg.format(epoch))
+
                 rets = parallel(delayed(_parallel_fit_per_epoch)(
                     train_loader,
                     epsilon,
@@ -431,6 +436,11 @@ def _forward(estimators, data):
             # Training loop
             for epoch in range(epochs):
                 self.train()
+
+                if self.n_jobs and self.n_jobs > 1:
+                    msg = "Parallelization on the training epoch: {:03d}"
+                    self.logger.info(msg.format(epoch))
+
                 rets = parallel(delayed(_parallel_fit_per_epoch)(
                     train_loader,
                     epsilon,
```
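
Both hunks guard on `self.n_jobs and self.n_jobs > 1`, which treats `n_jobs=None` (not set) the same as `n_jobs=1`: no parallelization, so no extra log line. A quick standalone check of that truthiness idiom (not library code):

```python
for n_jobs in (None, 1, 2):
    print(n_jobs, "->", bool(n_jobs and n_jobs > 1))
# None -> False, 1 -> False, 2 -> True
```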

torchensemble/bagging.py

Lines changed: 16 additions & 14 deletions
```diff
@@ -38,8 +38,6 @@ def _parallel_fit_per_epoch(train_loader,
     out-of-memory error.
     """
 
-    msg_list = []
-
     for batch_idx, (data, target) in enumerate(train_loader):
 
         batch_size = data.size(0)
@@ -70,14 +68,14 @@ def _parallel_fit_per_epoch(train_loader,
 
                 msg = ("Estimator: {:03d} | Epoch: {:03d} | Batch: {:03d}"
                        " | Loss: {:.5f} | Correct: {:d}/{:d}")
-                msg_list.append(msg.format(idx, epoch, batch_idx, loss,
-                                           correct, subsample_size))
+                print(msg.format(idx, epoch, batch_idx, loss,
+                                 correct, subsample_size))
             else:
                 msg = ("Estimator: {:03d} | Epoch: {:03d} | Batch: {:03d}"
                        " | Loss: {:.5f}")
-                msg_list.append(msg.format(idx, epoch, batch_idx, loss))
+                print(msg.format(idx, epoch, batch_idx, loss))
 
-    return estimator, optimizer, msg_list
+    return estimator, optimizer
 
 
 @torchensemble_model_doc("""Implementation on the BaggingClassifier.""",
@@ -160,6 +158,11 @@ def _forward(estimators, data):
             # Training loop
             for epoch in range(epochs):
                 self.train()
+
+                if self.n_jobs and self.n_jobs > 1:
+                    msg = "Parallelization on the training epoch: {:03d}"
+                    self.logger.info(msg.format(epoch))
+
                 rets = parallel(delayed(_parallel_fit_per_epoch)(
                     train_loader,
                     estimator,
@@ -176,12 +179,9 @@ def _forward(estimators, data):
             )
 
             estimators, optimizers = [], []
-            for estimator, optimizer, msgs in rets:
+            for estimator, optimizer in rets:
                 estimators.append(estimator)
                 optimizers.append(optimizer)
-                # Write logging info
-                for msg in msgs:
-                    self.logger.info(msg)
 
             # Validation
             if test_loader:
@@ -317,6 +317,11 @@ def _forward(estimators, data):
             # Training loop
             for epoch in range(epochs):
                 self.train()
+
+                if self.n_jobs and self.n_jobs > 1:
+                    msg = "Parallelization on the training epoch: {:03d}"
+                    self.logger.info(msg.format(epoch))
+
                 rets = parallel(delayed(_parallel_fit_per_epoch)(
                     train_loader,
                     estimator,
@@ -333,12 +338,9 @@ def _forward(estimators, data):
             )
 
             estimators, optimizers = [], []
-            for estimator, optimizer, msgs in rets:
+            for estimator, optimizer in rets:
                 estimators.append(estimator)
                 optimizers.append(optimizer)
-                # Write logging info
-                for msg in msgs:
-                    self.logger.info(msg)
 
             # Validation
             if test_loader:
```
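
With `msg_list` gone, everything `_parallel_fit_per_epoch` sends back to the parent is the two-tuple `(estimator, optimizer)`; whatever a joblib worker returns is pickled across the process boundary, so a slimmer return value is also a slimmer payload. A minimal sketch of the new calling convention, with string stand-ins for the real objects:

```python
from joblib import Parallel, delayed


def _fit_one(idx):
    # Stand-ins for a trained estimator and its optimizer; the real code
    # returns the actual (picklable) objects.
    return "estimator-{:d}".format(idx), "optimizer-{:d}".format(idx)


rets = Parallel(n_jobs=2)(delayed(_fit_one)(i) for i in range(3))

estimators, optimizers = [], []
for estimator, optimizer in rets:  # two-tuple now, no msg_list
    estimators.append(estimator)
    optimizers.append(optimizer)
```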

torchensemble/voting.py

Lines changed: 16 additions & 14 deletions
```diff
@@ -37,8 +37,6 @@ def _parallel_fit_per_epoch(train_loader,
     out-of-memory error.
     """
 
-    msg_list = []
-
     for batch_idx, (data, target) in enumerate(train_loader):
 
         batch_size = data.size(0)
@@ -60,15 +58,15 @@ def _parallel_fit_per_epoch(train_loader,
 
                 msg = ("Estimator: {:03d} | Epoch: {:03d} | Batch: {:03d}"
                        " | Loss: {:.5f} | Correct: {:d}/{:d}")
-                msg_list.append(msg.format(idx, epoch, batch_idx, loss,
-                                           correct, batch_size))
+                print(msg.format(idx, epoch, batch_idx, loss,
+                                 correct, batch_size))
             # Regression
             else:
                 msg = ("Estimator: {:03d} | Epoch: {:03d} | Batch: {:03d}"
                        " | Loss: {:.5f}")
-                msg_list.append(msg.format(idx, epoch, batch_idx, loss))
+                print(msg.format(idx, epoch, batch_idx, loss))
 
-    return estimator, optimizer, msg_list
+    return estimator, optimizer
 
 
 @torchensemble_model_doc("""Implementation on the VotingClassifier.""",
@@ -151,6 +149,11 @@ def _forward(estimators, data):
             # Training loop
             for epoch in range(epochs):
                 self.train()
+
+                if self.n_jobs and self.n_jobs > 1:
+                    msg = "Parallelization on the training epoch: {:03d}"
+                    self.logger.info(msg.format(epoch))
+
                 rets = parallel(delayed(_parallel_fit_per_epoch)(
                     train_loader,
                     estimator,
@@ -167,12 +170,9 @@ def _forward(estimators, data):
             )
 
             estimators, optimizers = [], []
-            for estimator, optimizer, msgs in rets:
+            for estimator, optimizer in rets:
                 estimators.append(estimator)
                 optimizers.append(optimizer)
-                # Write logging info
-                for msg in msgs:
-                    self.logger.info(msg)
 
             # Validation
             if test_loader:
@@ -309,6 +309,11 @@ def _forward(estimators, data):
             # Training loop
             for epoch in range(epochs):
                 self.train()
+
+                if self.n_jobs and self.n_jobs > 1:
+                    msg = "Parallelization on the training epoch: {:03d}"
+                    self.logger.info(msg.format(epoch))
+
                 rets = parallel(delayed(_parallel_fit_per_epoch)(
                     train_loader,
                     estimator,
@@ -325,12 +330,9 @@ def _forward(estimators, data):
             )
 
             estimators, optimizers = [], []
-            for estimator, optimizer, msgs in rets:
+            for estimator, optimizer in rets:
                 estimators.append(estimator)
                 optimizers.append(optimizer)
-                # Write logging info
-                for msg in msgs:
-                    self.logger.info(msg)
 
             # Validation
             if test_loader:
```
