fix: resume training vs force first round loss handling, also for SNPE

janfb · janfb · commit 6012fa1b2318 · 2024-08-14T09:37:20.000+02:00
diff --git a/sbi/inference/fmpe/fmpe_base.py b/sbi/inference/fmpe/fmpe_base.py
@@ -133,7 +133,7 @@ def train(
         max_num_epochs: int = 2**31 - 1,
         clip_max_norm: Optional[float] = 5.0,
         resume_training: bool = False,
-        train_with_proposal_without_correction: bool = False,
+        force_first_round_loss: bool = False,
         show_train_summary: bool = False,
         dataloader_kwargs: Optional[dict] = None,
     ) -> ConditionalDensityEstimator:
@@ -146,8 +146,11 @@ def train(
             stop_after_epochs: Number of epochs to train for. Defaults to 20.
             max_num_epochs: Maximum number of epochs to train for.
             clip_max_norm: Maximum norm for gradient clipping. Defaults to 5.0.
-            resume_training: Whether to resume training. Defaults to False.
-            train_with_proposal_without_correction: Whether to allow training with
+            resume_training: Can be used in case training time is limited, e.g. on a
+                cluster. If `True`, the split between train and validation set, the
+                optimizer, the number of epochs, and the best validation log-prob will
+                be restored from the last time `.train()` was called.
+            force_first_round_loss: Whether to allow training with
                 simulations that have not been sampled from the prior, e.g., in a
                 sequential inference setting. Note that can lead to biased inference
                 results.
@@ -162,16 +165,18 @@ def train(
         self._round = max(self._data_round_index)
 
         if self._round == 0 and self._neural_net is not None:
-            assert train_with_proposal_without_correction or resume_training, (
-                "You have already trained this neural network and now appended new "
-                "simulations with `append_simulations(theta, x)` without providing a "
-                "proposal. If the new simulations are sampled from the prior, you "
-                "can avoid this error by passing "
-                "`train_with_proposal_without_correction=True` to `train(...)` "
-                "However, if the new simulations were not "
-                "sampled from the prior, the result of FMPE will not be the true "
-                "posterior. Instead, it will be the proposal posterior, which "
-                "(usually) is more narrow than the true posterior. ",
+            assert force_first_round_loss or resume_training, (
+                "You have already trained this neural network. After you had trained "
+                "the network, you again appended simulations with `append_simulations"
+                "(theta, x)`, but you did not provide a proposal. If the new "
+                "simulations are sampled from the prior, you can set "
+                "`.train(..., force_first_round_loss=True`). However, if the new "
+                "simulations were not sampled from the prior, you should pass the "
+                "proposal, i.e. `append_simulations(theta, x, proposal)`. If "
+                "your samples are not sampled from the prior and you do not pass a "
+                "proposal and you set `force_first_round_loss=True`, the result of "
+                "FMPE will not be the true posterior. Instead, it will be the proposal "
+                "posterior, which (usually) is more narrow than the true posterior."
             )
 
         start_idx = 0  # as there is no multi-round FMPE yet
diff --git a/sbi/inference/snpe/snpe_base.py b/sbi/inference/snpe/snpe_base.py
@@ -263,7 +263,7 @@ def train(
         self._round = max(self._data_round_index)
 
         if self._round == 0 and self._neural_net is not None:
-            assert force_first_round_loss, (
+            assert force_first_round_loss or resume_training, (
                 "You have already trained this neural network. After you had trained "
                 "the network, you again appended simulations with `append_simulations"
                 "(theta, x)`, but you did not provide a proposal. If the new "
diff --git a/tests/linearGaussian_fmpe_test.py b/tests/linearGaussian_fmpe_test.py
@@ -214,7 +214,7 @@ def test_c2st_fmpe_for_different_dims_and_resume_training(density_estimator="mlp
     )
 
     inference = inference.append_simulations(theta, x)
-    posterior_estimator = inference.train(max_num_epochs=10)
+    posterior_estimator = inference.train(max_num_epochs=2)
     # Test whether we can stop and resume.
     posterior_estimator = inference.train(resume_training=True)
 
@@ -416,5 +416,5 @@ def test_multi_round_handling_fmpe():
 
     # Append new data with a proposal. This should work without any issues.
     inference.append_simulations(theta_new, x_new).train(
-        max_num_epochs=2, train_with_proposal_without_correction=True
+        max_num_epochs=2, force_first_round_loss=True
     )

Original file line number	Diff line number	Diff line change
`@@ -214,7 +214,7 @@ def test_c2st_fmpe_for_different_dims_and_resume_training(density_estimator="mlp`
`214`	`214`	`)`
`215`	`215`
`216`	`216`	`inference = inference.append_simulations(theta, x)`
`217`		`- posterior_estimator = inference.train(max_num_epochs=10)`
	`217`	`+ posterior_estimator = inference.train(max_num_epochs=2)`
`218`	`218`	`# Test whether we can stop and resume.`
`219`	`219`	`posterior_estimator = inference.train(resume_training=True)`
`220`	`220`
`@@ -416,5 +416,5 @@ def test_multi_round_handling_fmpe():`
`416`	`416`
`417`	`417`	`# Append new data with a proposal. This should work without any issues.`
`418`	`418`	`inference.append_simulations(theta_new, x_new).train(`
`419`		`- max_num_epochs=2, train_with_proposal_without_correction=True`
	`419`	`+ max_num_epochs=2, force_first_round_loss=True`
`420`	`420`	`)`