Merge branch 'popsim-consortium:main' into handle_test_warnings

popsim-consortium · Dec 23, 2024 · 8b1b4ee · 8b1b4ee
2 parents ca04e54 + d6e0406
commit 8b1b4ee
Show file tree

Hide file tree

Showing 3 changed files with 90 additions and 16 deletions.
diff --git a/.github/ISSUE_TEMPLATE/dfe-qc-issue-template.md b/.github/ISSUE_TEMPLATE/dfe-qc-issue-template.md
@@ -0,0 +1,17 @@
+---
+name: DFE QC issue template
+about: Quality control process for DFE addition
+title: QC for {dfe_id} ({species})
+labels: DFE QC
+assignees: ''
+
+---
+
+**PR for new model:** {link to Pull Request}
+**Original paper:** {link to original paper}
+**Parameter values:** {reference to where parameter values can be found}
+
+**Potential issues that might lead to differences between the model implementations:**
+{description of any potential issues}
+
+**QC'er requests:** {tag potential developers to QC the model}
diff --git a/docs/development.rst b/docs/development.rst
@@ -1652,7 +1652,7 @@ Testing your DFE model and submitting a PR
 
 After you have finished your implementation and specified all the
 necessary citations,
-we recommend that you run some basic local tests to see that
+we recommend that you run some basic local checks to see that
 the model was successfully loaded to ``stdpopsim``.
 You may follow the process outlined for `Testing your demographic model and submitting a PR`_.
 
@@ -1667,24 +1667,31 @@ of the development team before it is fully incorporated into ``stdpopsim``.
 This will likely require additional feedback from you,
 so, stay tuned for discussion during the review process.
 
+To facilitate this, there is one more step: please open a
+`new issue <https://github.com/popsim-consortium/stdpopsim/issues/new>`__,
+using the "DFE QC" template.
+The template asks for the basic information that someone will need
+to independently verify the implemented DFE.
+
 ---------------------
 Reviewing a DFE model
 ---------------------
 
-The review process for DFE models is currently being developed.
-For now, we suggest that you
-`open a new blank issue <https://github.com/popsim-consortium/stdpopsim/issues/new>`__
-and specify the following information:
+The process for reviewing a DFE is essentially the same
+as for reviewing a demographic model (see `Overview of the stdpopsim review process`_).
+Briefly, you will re-implement the DFE "blind", i.e., without looking at the DFE
+implementation already added to the code.
+Then, the unit tests check whether the implementations are equivalent.
+To do this, you add your implementation to ``stdpopsim/qc/<SPECIES_ID>.py``,
+followed by a call like
+
+.. code-block:: python
 
-1. **PR for new model:**
-2. **Original paper:**
-3. **Parameter values:**
-4. **Potential issues:**
-5. **QC'er requests:**
+    _species.get_dfe(_MODEL_ID_).register_qc(_your_review_function())
 
-A reviewer will be assigned to check your implementation and approve it.
-All discussion about the review can be conducted in the **QC issue**
-mentioned above.
+where ``_MODEL_ID_`` is the string specified as the ID for the original DFE,
+and ``_your_review_function()`` is the function you've added to the QC file
+that returns a DFE object.
 
 ****************
 Coding standards

diff --git a/tests/test_slim_engine.py b/tests/test_slim_engine.py
@@ -321,6 +321,30 @@ def test_recap_and_rescale_on_external_slim_run(self, tmp_path):
         assert tables1.edges == tables2.edges
         assert tables1.mutations == tables2.mutations
 
+    def test_recap_start_time(self):
+        # Check that all tree roots are at the time recorded in the SLiM
+        # "cycle" metadata, which is the time to start adding mutations from.
+        # (Whether it matches or is off by 1 or 2 depends on the stages in which
+        # the simulation is set up and written out; see pyslim:#308.)
+        engine = stdpopsim.get_engine("slim")
+        species = stdpopsim.get_species("AnaPla")
+        contig = species.get_contig(length=1e3)
+        model = stdpopsim.PiecewiseConstantSize(100)
+        samples = {"pop_0": 10}
+        ts = engine.simulate(
+            demographic_model=model,
+            contig=contig,
+            samples=samples,
+            slim_burn_in=3,
+            _recap_and_rescale=False,
+        )
+        root_times = set([ts.node(n).time for t in ts.trees() for n in t.roots])
+        assert root_times == set(
+            [
+                ts.metadata["SLiM"]["cycle"],
+            ]
+        )
+
     def test_assert_min_version(self):
         engine = stdpopsim.get_engine("slim")
         with mock.patch(
@@ -1149,6 +1173,7 @@ def test_chr1(self, Q):
             samples=samples,
             slim_burn_in=0.1,
             verbosity=3,
+            seed=888,
         )
         self.verify_recombination_map(contig, ts)
 
@@ -1171,6 +1196,7 @@ def test_off_by_one(self):
             samples=samples,
             slim_burn_in=0.1,
             verbosity=3,
+            seed=456,
         )
         self.verify_recombination_map(contig, ts)
         assert list(ts.breakpoints()) == [0.0, midpoint, contig.length]
@@ -1526,6 +1552,7 @@ def test_default_dfe(self):
             contig=contig,
             samples=self.samples,
             verbosity=3,  # to get metadata output
+            seed=135,
         )
         self.verify_genomic_elements(contig, ts)
         self.verify_mutation_rates(contig, ts)
@@ -1545,6 +1572,7 @@ def test_multiple_dfes(self):
             contig=contig,
             samples=self.samples,
             verbosity=3,  # to get metadata output
+            seed=246,
         )
         self.verify_genomic_elements(contig, ts)
         self.verify_mutation_rates(contig, ts)
@@ -1562,6 +1590,7 @@ def test_unused_dfe(self):
             contig=contig,
             samples=self.samples,
             verbosity=3,  # to get metadata output
+            seed=357,
         )
         self.verify_genomic_elements(contig, ts)
         self.verify_mutation_rates(contig, ts)
@@ -1596,6 +1625,7 @@ def test_same_dfes(self):
             contig=contig,
             samples=self.samples,
             verbosity=3,  # to get metadata output
+            seed=468,
         )
         self.verify_genomic_elements(contig, ts)
         self.verify_mutation_rates(contig, ts)
@@ -1624,6 +1654,7 @@ def test_slim_produces_mutations(self):
             slim_scaling_factor=10,
             slim_burn_in=0.1,
             verbosity=3,  # to get metadata output
+            seed=579,
             _recap_and_rescale=False,
         )
         assert ts.num_sites > 0
@@ -1640,6 +1671,7 @@ def test_no_neutral_mutations_are_simulated_by_slim(self):
             slim_scaling_factor=10,
             slim_burn_in=0.1,
             verbosity=3,
+            seed=147,
             _recap_and_rescale=False,
         )
         assert ts.num_sites == 0
@@ -1658,6 +1690,7 @@ def test_no_neutral_mutations_are_simulated_by_slim(self):
             slim_scaling_factor=10,
             slim_burn_in=0.1,
             verbosity=3,
+            seed=258,
             _recap_and_rescale=False,
         )
         assert ts.num_sites == 0
@@ -1676,6 +1709,7 @@ def test_neutral_dfe_slim_proportions(self):
             slim_scaling_factor=Q,
             slim_burn_in=0.1,
             verbosity=3,
+            seed=369,
             _recap_and_rescale=False,
         )
         ge_types = self.slim_metadata_key0(
@@ -1708,6 +1742,7 @@ def test_neutral_dfe_slim_proportions(self):
             slim_scaling_factor=Q,
             slim_burn_in=0.1,
             verbosity=3,
+            seed=470,
             _recap_and_rescale=False,
         )
         ge_types = self.slim_metadata_key0(
@@ -1757,6 +1792,7 @@ def test_chromosomal_segment(self):
             contig=contig,
             samples=self.samples,
             verbosity=3,  # to get metadata output
+            seed=159,
         )
         self.verify_genomic_elements(contig, ts)
         self.verify_mutation_rates(contig, ts)
@@ -1837,6 +1873,7 @@ def test_dominance_coeff_list(self):
             contig=contig,
             samples=self.samples,
             verbosity=3,  # to get metadata output
+            seed=260,
         )
         assert len(ts.metadata["stdpopsim"]["DFEs"]) == len(contig.dfe_list) + 1
         # slim mutation type IDs with dominance coeff lists:
@@ -2220,6 +2257,7 @@ def test_drawn_mutation_not_lost(self):
             extended_events=extended_events,
             slim_scaling_factor=10,
             slim_burn_in=0.1,
+            seed=321,
             _recap_and_rescale=False,
         )
         assert ts.num_mutations == 1
@@ -2252,6 +2290,7 @@ def test_drawn_mutation_is_lost(self):
             extended_events=extended_events,
             slim_scaling_factor=10,
             slim_burn_in=0.1,
+            seed=432,
             _recap_and_rescale=False,
         )
         assert ts.num_mutations == 0
@@ -2478,6 +2517,7 @@ def test_referenced_single_site_is_nonneutral(self):
             contig=contig,
             samples=self.samples,
             extended_events=extended_events,
+            seed=543,
         )
         referenced_dfe = ts.metadata["stdpopsim"]["DFEs"][1]
         assert referenced_dfe["id"] == "one"
@@ -2694,6 +2734,7 @@ def test_sweep(self, tmp_path):
                     slim_burn_in=1,
                     logfile=logfile,
                     logfile_interval=1,
+                    seed=654,
                 )
                 in_sweep, outside_sweep, _ = self._fitness_per_generation(
                     logfile=logfile,
@@ -2737,6 +2778,7 @@ def test_sweep_meets_min_freq_at_start(self, tmp_path):
                 slim_burn_in=1,
                 logfile=logfile,
                 logfile_interval=1,
+                seed=654,
             )
             in_sweep, outside_sweep, rejections = self._fitness_per_generation(
                 logfile=logfile,
@@ -2784,6 +2826,7 @@ def test_sweep_meets_min_freq_at_end(self, tmp_path):
                 slim_burn_in=1,
                 logfile=logfile,
                 logfile_interval=1,
+                seed=765,
             )
             in_sweep, outside_sweep, rejections = self._fitness_per_generation(
                 logfile=logfile,
@@ -2865,6 +2908,7 @@ def test_global_sweep(self, tmp_path):
                 slim_burn_in=1,
                 logfile=logfile,
                 logfile_interval=1,
+                seed=876,
             )
             p0_in_sweep, p0_outside_sweep, _ = self._fitness_per_generation(
                 logfile=logfile,
@@ -2917,6 +2961,7 @@ def test_local_sweep(self, tmp_path):
             slim_burn_in=1,
             logfile=logfile,
             logfile_interval=1,
+            seed=987,
         )
         p0_in_sweep, p0_outside_sweep, _ = self._fitness_per_generation(
             logfile=logfile,
@@ -2972,6 +3017,7 @@ def test_sweeps_at_multiple_sites(self, tmp_path):
             slim_burn_in=1,
             logfile=logfile,
             logfile_interval=1,
+            seed=531,
         )
         for i, _ in enumerate(pop_ids):
             in_sweep, outside_sweep, _ = self._fitness_per_generation(
@@ -3024,6 +3070,7 @@ def test_sweep_with_background_selection(self, tmp_path):
             slim_burn_in=1,
             logfile=logfile,
             logfile_interval=1,
+            seed=642,
         )
         p0_in_sweep, p0_outside_sweep, _ = self._fitness_per_generation(
             logfile=logfile,
@@ -3071,6 +3118,7 @@ def test_stacked(self):
                 contig=contig,
                 samples=self.samples,
                 slim_burn_in=10,
+                seed=753,
             )
             is_stacked = [len(m.metadata["mutation_list"]) > 1 for m in ts.mutations()]
             if any(is_stacked):
@@ -3093,6 +3141,7 @@ def test_msprime(self):
                 demographic_model=self.model,
                 contig=contig,
                 samples=self.samples,
+                seed=864,
             )
             if ts.num_mutations > 0:
                 break
@@ -3109,6 +3158,7 @@ def test_errors(self):
                 demographic_model=self.model,
                 contig=contig,
                 samples=self.samples,
+                seed=975,
             )
             if ts.num_mutations > 0:
                 break
@@ -3256,7 +3306,7 @@ def test_slim_population_size_diploid(self, caplog):
         contig = stdpopsim.Contig.basic_contig(length=1000, ploidy=2)
         model = stdpopsim.PiecewiseConstantSize(N)
         with caplog.at_level(logging.DEBUG):
-            engine.simulate(model, contig, samples={"pop_0": 2}, verbosity=2)
+            engine.simulate(model, contig, samples={"pop_0": 2}, verbosity=2, seed=9)
         log_str = " ".join([rec.getMessage() for rec in caplog.records])
         # match: "1: p = sim.addSubpop(0, <SLiM population size>);"
         extract_ne = re.compile(".+1: p = sim.addSubpop\\(0, ([0-9]+)\\).+")
@@ -3294,7 +3344,7 @@ def test_individual_ploidy(self):
         engine = stdpopsim.get_engine("slim")
         for ploidy in [1, 2]:
             contig = stdpopsim.Contig.basic_contig(length=1000, ploidy=ploidy)
-            ts = engine.simulate(model, contig, samples={"pop_0": 2})
+            ts = engine.simulate(model, contig, samples={"pop_0": 2}, seed=8)
             assert ts.num_individuals == 2
             assert ts.num_samples == 2 * ploidy
             individual = ts.tables.nodes.individual
@@ -3306,7 +3356,7 @@ def test_haploidize_individuals(self):
         model = stdpopsim.PiecewiseConstantSize(N)
         engine = stdpopsim.get_engine("slim")
         contig = stdpopsim.Contig.basic_contig(length=1000, ploidy=2)
-        ts = engine.simulate(model, contig, samples={"pop_0": 3})
+        ts = engine.simulate(model, contig, samples={"pop_0": 3}, seed=7)
         ts_hap = stdpopsim.utils.haploidize_individuals(ts)
         assert ts_hap.num_individuals == ts.num_individuals * 2
         for i, j in zip(ts.samples(), ts_hap.samples()):