Skip to content

Commit

Permalink
modified citation info for Lauterbur et al. (2023) in docs
Browse files Browse the repository at this point in the history
Implemented PhoSin species (Vaquita). First version (before QC)
  • Loading branch information
igronau committed Sep 13, 2023
1 parent 9ed687c commit bf0b81d
Show file tree
Hide file tree
Showing 4 changed files with 235 additions and 38 deletions.
69 changes: 31 additions & 38 deletions docs/introduction.rst
Original file line number Diff line number Diff line change
Expand Up @@ -77,24 +77,24 @@ major additions to the catalog:
Travis J Struck, Simon Gravel, Ryan N Gutenkunst, Kirk E Lohmeuller,
Peter L Ralph, Daniel R Schrider, Adam Siepel, Jerome Kelleher, Andrew D Kern (2020),
*A community-maintained standard library of population genetic models*,
eLife 2020;9:e54967; doi: https://doi.org/10.7554/eLife.54967

- M. Elise Lauterbur, Mariz Izabel A. Cavassim, Ariella L. Gladstein, Graham
Gower, Nathaniel S. Pope, Georgia Tsambos, Jeffrey Adrion, Saurabh Belsare,
Arjun Biddanda, Victoria Caudill, Jean Cury, Ignacio Echevarria, Benjamin C.
Haller, Ahmed R. Hasan, Xin Huang, Leonardo Nicola Martin Iasi, Ekaterina
Noskova, Jana Obšteter, Vitor Antonio Corrêa Pavinato, Alice Pearson, David
Peede, Manolo F. Perez, Murillo F. Rodrigues, Chris C. R. Smith, Jeffrey P.
Spence, Anastasia Teterina, Silas Tittes, Per Unneberg, Juan Manuel Vazquez,
Ryan K. Waples, Anthony Wilder Wohns, Yan Wong, Franz Baumdicker, Reed A.
Cartwright, Gregor Gorjanc, Ryan N. Gutenkunst, Jerome Kelleher, Andrew D.
Kern, Aaron P. Ragsdale, Peter L. Ralph, Daniel R. Schrider, Ilan Gronau (2022).
eLife 9:e54967; doi: https://doi.org/10.7554/eLife.54967

- M. Elise Lauterbur, Maria Izabel A. Cavassim, Ariella L. Gladstein, Graham Gower,
Nathaniel S. Pope, Georgia Tsambos, Jeff Adrion, Saurabh Belsare, Arjun Biddanda,
Victoria Caudill, Jean Cury, Ignacio Echevarria, Benjamin C. Haller, Ahmed R. Hasan,
Xin Huang, Leonardo Nicola Martin Iasi, Ekaterina Noskova, Jana Obšteter,
Vitor Antonio Corrêa Pavinato, Alice Pearson, David Peede, Manolo F. Perez,
Murillo F. Rodrigues, Chris C. R. Smith, Jeffrey P. Spence, Anastasia Teterina,
Silas Tittes, Per Unneberg, Juan Manuel Vazquez, Ryan K. Waples, Anthony Wilder Wohns,
Yan Wong, Franz Baumdicker, Reed A. Cartwright, Gregor Gorjanc, Ryan N. Gutenkunst,
Jerome Kelleher, Andrew D. Kern, Aaron P. Ragsdale, Peter L. Ralph, Daniel R. Schrider,
Ilan Gronau (2023)
*Expanding the stdpopsim species catalog, and lessons learned for realistic genome simulations*,
bioRxiv 2022.10.29.514266; doi: https://doi.org/10.1101/2022.10.29.514266
eLife 12:RP84874; doi: https://doi.org/10.7554/eLife.84874.2

Bibtex records::

@article {10.7554/eLife.54967,
@article {10.7554/eLife.54967,
article_type = {journal},
title = {A community-maintained standard library of population genetic models},
author = {Adrion, Jeffrey R and Cole, Christopher B and Dukler, Noah and Galloway, Jared
Expand All @@ -121,30 +121,23 @@ Bibtex records::
publisher = {eLife Sciences Publications, Ltd},
}

@article {Lauterbur2022.10.29.514266,
author = {Lauterbur, M. Elise and Cavassim, Mariz Izabel A. and
Gladstein, Ariella L. and Gower, Graham and Pope, Nathaniel S. and
Tsambos, Georgia and Adrion, Jeffrey and Belsare, Saurabh and Biddanda,
Arjun and Caudill, Victoria and Cury, Jean and Echevarria, Ignacio and
Haller, Benjamin C. and Hasan, Ahmed R. and Huang, Xin and Iasi,
Leonardo Nicola Martin and Noskova, Ekaterina and Ob{\v s}teter, Jana
and Pavinato, Vitor Antonio Corr{\^e}a and Pearson, Alice and Peede,
David and Perez, Manolo F. and Rodrigues, Murillo F. and Smith, Chris
C. R. and Spence, Jeffrey P. and Teterina, Anastasia and Tittes, Silas
and Unneberg, Per and Vazquez, Juan Manuel and Waples, Ryan K. and
Wohns, Anthony Wilder and Wong, Yan and Baumdicker, Franz and
Cartwright, Reed A. and Gorjanc, Gregor and Gutenkunst, Ryan N. and
Kelleher, Jerome and Kern, Andrew D. and Ragsdale, Aaron P. and Ralph,
Peter L. and Schrider, Daniel R. and Gronau, Ilan},
title = {Expanding the stdpopsim species catalog, and lessons learned
for realistic genome simulations},
elocation-id = {2022.10.29.514266},
year = {2022},
doi = {10.1101/2022.10.29.514266},
publisher = {Cold Spring Harbor Laboratory},
URL = {https://www.biorxiv.org/content/early/2022/10/31/2022.10.29.514266},
eprint = {https://www.biorxiv.org/content/early/2022/10/31/2022.10.29.514266.full.pdf},
journal = {bioRxiv}
@article{10.7554/eLife.84874.2,
title={Expanding the stdpopsim species catalog, and lessons learned for realistic genome simulations},
author = {M. Elise Lauterbur and Maria Izabel A. Cavassim and Ariella L. Gladstein and Graham Gower and
Nathaniel S. Pope and Georgia Tsambos and Jeff Adrion and Saurabh Belsare and Arjun Biddanda and
Victoria Caudill and Jean Cury and Ignacio Echevarria and Benjamin C. Haller and Ahmed R. Hasan and
Xin Huang and Leonardo Nicola Martin Iasi and Ekaterina Noskova and Jana Ob{\v{s}}teter and
Vitor Antonio Corr{\^{e}}a Pavinato and Alice Pearson and David Peede and Manolo F. Perez and
Murillo F. Rodrigues and Chris C. R. Smith and Jeffrey P. Spence and Anastasia Teterina and
Silas Tittes and Per Unneberg and Juan Manuel Vazquez and Ryan K. Waples and Anthony Wilder Wohns and
Yan Wong and Franz Baumdicker and Reed A. Cartwright and Gregor Gorjanc and Ryan N. Gutenkunst and
Jerome Kelleher and Andrew D. Kern and Aaron P. Ragsdale and Peter L. Ralph and Daniel R. Schrider and
Ilan Gronau},
doi = {10.7554/elife.84874.2},
url = {https://doi.org/10.7554/elife.84874.2},
year = 2023,
month = {may},
publisher = {{eLife} Sciences Publications, Ltd},
}


Expand Down
4 changes: 4 additions & 0 deletions stdpopsim/catalog/PhoSin/__init__.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,4 @@
"""
Catalog definitions for PhoSin (Ensembl ID='phocoena_sinus')
"""
from . import species # noqa: F401
29 changes: 29 additions & 0 deletions stdpopsim/catalog/PhoSin/genome_data.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,29 @@
# File autogenerated from Ensembl REST API. Do not edit.
data = {
"assembly_accession": "GCA_008692025.1",
"assembly_name": "mPhoSin1.pri",
"chromosomes": {
"1": {"length": 185845356, "synonyms": []},
"2": {"length": 178563925, "synonyms": []},
"3": {"length": 174291665, "synonyms": []},
"4": {"length": 146127150, "synonyms": []},
"5": {"length": 139762554, "synonyms": []},
"6": {"length": 115952311, "synonyms": []},
"7": {"length": 115469292, "synonyms": []},
"8": {"length": 110408561, "synonyms": []},
"9": {"length": 106736052, "synonyms": []},
"10": {"length": 102828027, "synonyms": []},
"11": {"length": 104118372, "synonyms": []},
"12": {"length": 90399378, "synonyms": []},
"13": {"length": 90400161, "synonyms": []},
"14": {"length": 89762611, "synonyms": []},
"15": {"length": 88287594, "synonyms": []},
"16": {"length": 85252673, "synonyms": []},
"17": {"length": 79603858, "synonyms": []},
"18": {"length": 79885847, "synonyms": []},
"19": {"length": 59501331, "synonyms": []},
"20": {"length": 58878645, "synonyms": []},
"21": {"length": 35802323, "synonyms": []},
"X": {"length": 131664873, "synonyms": []},
},
}
171 changes: 171 additions & 0 deletions stdpopsim/catalog/PhoSin/species.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,171 @@
import stdpopsim

from . import genome_data

_species_ploidy = 2
_ploidy = {
"1": _species_ploidy,
"2": _species_ploidy,
"3": _species_ploidy,
"4": _species_ploidy,
"5": _species_ploidy,
"6": _species_ploidy,
"7": _species_ploidy,
"8": _species_ploidy,
"9": _species_ploidy,
"10": _species_ploidy,
"11": _species_ploidy,
"12": _species_ploidy,
"13": _species_ploidy,
"14": _species_ploidy,
"15": _species_ploidy,
"16": _species_ploidy,
"17": _species_ploidy,
"18": _species_ploidy,
"19": _species_ploidy,
"20": _species_ploidy,
"21": _species_ploidy,
"X": _species_ploidy,
}

# There is no good justificaiton for this value for now.
# We're using the value of 1e-8, which appears to be what
# Morin et al. (2021) used in their PSMC analysis
# (the default value), but I'm not sure, and this is not
# well justified
_overall_recombination_rate = 1e-8
_recombination_rate = {
"1": _overall_recombination_rate,
"2": _overall_recombination_rate,
"3": _overall_recombination_rate,
"4": _overall_recombination_rate,
"5": _overall_recombination_rate,
"6": _overall_recombination_rate,
"7": _overall_recombination_rate,
"8": _overall_recombination_rate,
"9": _overall_recombination_rate,
"10": _overall_recombination_rate,
"11": _overall_recombination_rate,
"12": _overall_recombination_rate,
"13": _overall_recombination_rate,
"14": _overall_recombination_rate,
"15": _overall_recombination_rate,
"16": _overall_recombination_rate,
"17": _overall_recombination_rate,
"18": _overall_recombination_rate,
"19": _overall_recombination_rate,
"20": _overall_recombination_rate,
"21": _overall_recombination_rate,
"X": _overall_recombination_rate,
}

# Genome-wide average mutation rate is estimated by Robinson et al. (2022)
# by using divergence from two closely related species: harbor porpoise
# (Phocoena phocoena) and Indo-Pacific finless porpoise (Neophocaena phocaenoides).
# Using these two species and a range of assumptions results in a range of
# plausible estimates depicted in Fig S12 in the paper.
# Eventually, the representative value used in most analyses in the paper was
# 5.83e-9, which is on the high side of the range, to take into account previous
# higher estimates of the mutation rate, cited by Morin et al. (2021).
_overall_mutation_rate = 5.83e-9

_mutation_rate = {
"1": _overall_mutation_rate,
"2": _overall_mutation_rate,
"3": _overall_mutation_rate,
"4": _overall_mutation_rate,
"5": _overall_mutation_rate,
"6": _overall_mutation_rate,
"7": _overall_mutation_rate,
"8": _overall_mutation_rate,
"9": _overall_mutation_rate,
"10": _overall_mutation_rate,
"11": _overall_mutation_rate,
"12": _overall_mutation_rate,
"13": _overall_mutation_rate,
"14": _overall_mutation_rate,
"15": _overall_mutation_rate,
"16": _overall_mutation_rate,
"17": _overall_mutation_rate,
"18": _overall_mutation_rate,
"19": _overall_mutation_rate,
"20": _overall_mutation_rate,
"21": _overall_mutation_rate,
"X": _overall_mutation_rate,
}

_genome = stdpopsim.Genome.from_data(
genome_data.data,
recombination_rate=_recombination_rate,
mutation_rate=_mutation_rate,
ploidy=_ploidy,
# [ Implementers: please insert citations for the papers you are basing
# the estimates for recombination and mutation rates. The assembly
# citation is optional and can be deleted if not needed.]
citations=[
stdpopsim.Citation(
author="Morin et al.",
year=2021,
doi="https://doi.org/10.1111/1755-0998.13284",
reasons={stdpopsim.CiteReason.ASSEMBLY},
),
stdpopsim.Citation(
author="Morin et al.",
year=2021,
doi="https://doi.org/10.1111/1755-0998.13284",
reasons={stdpopsim.CiteReason.REC_RATE},
),
stdpopsim.Citation(
author="Robinson et al.",
year=2022,
doi="https://doi.org/10.1126/science.abm1742",
reasons={stdpopsim.CiteReason.MUT_RATE},
),
],
)

_species = stdpopsim.Species(
id="PhoSin",
ensembl_id="phocoena_sinus",
name="Phocoena sinus",
common_name="Vaquita",
genome=_genome,
# Robinson et al. (2022) and Morin et al. (2021) assumed an average
# generation time of 11.9 years in their analyses/calibrations.
# They cite Taylor et al. (2007) as a primary source.
# Table 1 in that paper specifies estimates of generation
# times for 58 cetacean species. It seems like the value selected was
# the one inferred for the sister species of harbor porpoise (Phocoena
# phocoena). The value estimated for Vaquita is slightly smaller (11.4),
# but maybe it reflects a recent reducion in generation time (???)
generation_time=11.9,
# Demographic models inferred for Vaquita by Morin et al. (2021) and
# Robinson et al. (2022) typically estimate small Ne of 2,000 - 5,000
# in the past 500,000 years, likely followed by some sharp bottleneck.
# We selected as a representative Ne a value of 3500, which is also
# consistent with the average Ne inferred in the 2-epoch model of
# Robinson et al. (2022)
population_size=3500,
citations=[
stdpopsim.Citation(
author="Robinson et al.",
year=2022,
doi="https://doi.org/10.1126/science.abm1742",
reasons={stdpopsim.CiteReason.POP_SIZE},
),
stdpopsim.Citation(
author="Robinson et al.",
year=2022,
doi="https://doi.org/10.1126/science.abm1742",
reasons={stdpopsim.CiteReason.GEN_TIME},
),
stdpopsim.Citation(
author="Taylor et al.",
year=2007,
doi="https://aquadocs.org/handle/1834/41281",
reasons={stdpopsim.CiteReason.GEN_TIME},
),
],
)

stdpopsim.register_species(_species)

0 comments on commit bf0b81d

Please sign in to comment.