Skip to content

Commit

Permalink
Make genome length a const generic
Browse files Browse the repository at this point in the history
  • Loading branch information
arcresu committed Jun 9, 2023
1 parent 6a737f3 commit 69f6eda
Show file tree
Hide file tree
Showing 8 changed files with 56 additions and 32 deletions.
2 changes: 1 addition & 1 deletion examples/binned.rs
Original file line number Diff line number Diff line change
Expand Up @@ -32,7 +32,7 @@ fn main() -> Result<()> {
// use this instead for reproducible simulation:
// let rng = Xoshiro256PlusPlus::seed_from_u64(32189661_u64);

let genome = SimpleGenome::default();
let genome = SimpleGenome::<64>::default();
let ob = binned_outbreaks(genome, &disease_model, mutation_rate, &binned_cfg, rng)?;

let stdout = std::io::stdout();
Expand Down
10 changes: 8 additions & 2 deletions examples/combined.rs
Original file line number Diff line number Diff line change
Expand Up @@ -27,8 +27,14 @@ fn main() -> Result<()> {
// let mut rng = Xoshiro256PlusPlus::seed_from_u64(32189661_u64);

// simulate an initial outbreak
let index1 = SimpleGenome::default();
let mut ob = simulate_outbreak(index1, &disease_model, mutation_rate, max_cases, &mut rng)?;
let index1 = SimpleGenome::<64>::default();
let mut ob = simulate_outbreak(
index1.clone(),
&disease_model,
mutation_rate,
max_cases,
&mut rng,
)?;

// create a second outbreak from a new introduction of the disease 30 time steps later with 10
// SNPs separating it from the original index genome
Expand Down
2 changes: 1 addition & 1 deletion examples/simple.rs
Original file line number Diff line number Diff line change
Expand Up @@ -25,7 +25,7 @@ fn main() -> Result<()> {
// use this instead for reproducible simulation:
// let mut rng = Xoshiro256PlusPlus::seed_from_u64(9948901_u64);

let genome = SimpleGenome::default();
let genome = SimpleGenome::<256>::default();
let ob = simulate_outbreak(genome, &disease_model, mutation_rate, max_cases, &mut rng)?;

let stdout = std::io::stdout();
Expand Down
49 changes: 28 additions & 21 deletions src/genome/simple.rs
Original file line number Diff line number Diff line change
Expand Up @@ -6,33 +6,37 @@ use std::convert::TryInto;
use std::fmt;
use std::io;

/// number of distinct sites on the genome that can be represented.
pub const GENOME_LENGTH: usize = 64;
pub type GenomeStorage = BitArr!(for GENOME_LENGTH, in u64);
type GenomeStorage = BitBox<usize, Lsb0>;

/// Representation of a genome.
///
/// Internally this is represented as a vector of binary bits. Mutation is modelled by
/// Internally this is represented as an array of binary bits. Mutation is modelled by
/// selecting bits uniformly at random and flipping them.
///
/// This model enables efficient operations and compact storage.
#[derive(PartialEq, Eq, Clone, Copy, Default)]
pub struct SimpleGenome(GenomeStorage);
#[derive(PartialEq, Eq, Clone)]
pub struct SimpleGenome<const BP: usize>(GenomeStorage);

impl Genome for SimpleGenome {
impl<const BP: usize> Default for SimpleGenome<BP> {
fn default() -> Self {
SimpleGenome(bitbox![usize, Lsb0; 0; BP])
}
}

impl<const BP: usize> Genome for SimpleGenome<BP> {
/// Flip exactly `n_mutations` bits chosen at random.
///
/// Panics if the requested number of mutations is greater than the fixed width of the
/// representation.
fn mutate<R: Rng>(&self, n_mutations: usize, mut rng: R) -> Self {
let mut new_genome = self.0;
assert!(
n_mutations <= GENOME_LENGTH,
n_mutations <= BP,
"Requested number of mutations ({}) exceeds width of genome representation ({})",
n_mutations,
GENOME_LENGTH
BP
);
for pos in index::sample(&mut rng, GENOME_LENGTH, n_mutations) {
let mut new_genome = self.0.clone();
for pos in index::sample(&mut rng, BP, n_mutations) {
let val = !new_genome.get(pos).unwrap();
new_genome.set(pos, val);
}
Expand All @@ -41,23 +45,26 @@ impl Genome for SimpleGenome {

/// Counts the bitwise differences between the genome representations.
fn snps(&self, other: &Self) -> u32 {
(self.0 ^ other.0).count_ones().try_into().unwrap()
(self.0.clone() ^ other.0.clone())
.count_ones()
.try_into()
.unwrap()
}

/// Relabels 1 and 0 as A and C respectively.
fn write_nucleotides<W: io::Write>(&self, mut writer: W) -> io::Result<()> {
for base in self.0 {
write!(writer, "{}", if base { 'A' } else { 'C' })?;
for base in self.0.as_bitslice() {
write!(writer, "{}", if *base { 'A' } else { 'C' })?;
}
Ok(())
}
}

impl fmt::Debug for SimpleGenome {
impl<const BP: usize> fmt::Debug for SimpleGenome<BP> {
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
write!(f, "SimpleGenome(")?;
for base in self.0 {
write!(f, "{}", if base { 'A' } else { 'C' })?;
for base in self.0.as_bitslice() {
write!(f, "{}", if *base { 'A' } else { 'C' })?;
}
write!(f, ")")
}
Expand All @@ -71,22 +78,22 @@ mod tests {

#[test]
fn test_empty() {
let genome1 = SimpleGenome::default();
let genome2 = SimpleGenome::default();
let genome1 = SimpleGenome::<64>::default();
let genome2 = SimpleGenome::<64>::default();
assert_eq!(genome1.snps(&genome2), 0);
}

#[test]
fn test_mutation() {
let mut rng = Xoshiro256PlusPlus::seed_from_u64(89324 as u64);
let genome = SimpleGenome::default();
let genome = SimpleGenome::<64>::default();
assert_ne!(genome, genome.mutate(4, &mut rng));
}

#[test]
fn test_distance() {
let mut rng = Xoshiro256PlusPlus::seed_from_u64(89324 as u64);
let genome = SimpleGenome::default();
let genome = SimpleGenome::<64>::default();
let child = genome.mutate(5, &mut rng);
assert_eq!(genome.snps(&child), 5);
assert_eq!(child.snps(&genome), 5);
Expand Down
4 changes: 2 additions & 2 deletions src/lib.rs
Original file line number Diff line number Diff line change
Expand Up @@ -28,7 +28,7 @@
//! // stop the simulation at the end of a time step where the case count exceeds 100
//! let max_cases = 100;
//!
//! let genome = SimpleGenome::default();
//! let genome = SimpleGenome::<64>::default();
//! let ob = simulate_outbreak(genome, &disease_model, mutation_rate, max_cases, &mut rng);
//! assert!(ob.is_ok());
//!
Expand Down Expand Up @@ -60,7 +60,7 @@ pub mod simple {
//! and can be configured to match details of a pathogen of interest.
pub use crate::disease::simple::SimpleDisease;
pub use crate::genome::simple::{GenomeStorage, SimpleGenome, GENOME_LENGTH};
pub use crate::genome::simple::SimpleGenome;
}

pub use disease::covid;
2 changes: 1 addition & 1 deletion src/simulate/binned.rs
Original file line number Diff line number Diff line change
Expand Up @@ -272,7 +272,7 @@ mod tests {
bad_simulation_cap: 2000,
};
let mut rng = Xoshiro256PlusPlus::seed_from_u64(89324 as u64);
let genome = SimpleGenome::default();
let genome = SimpleGenome::<64>::default();
let outbreaks = binned_outbreaks(genome, &dm, mutation_rate, &sim_cfg, &mut rng).unwrap();

assert_eq!(
Expand Down
2 changes: 1 addition & 1 deletion src/simulate/mod.rs
Original file line number Diff line number Diff line change
Expand Up @@ -140,7 +140,7 @@ mod tests {
infectiousness: vec![0.34, 0.33, 0.33],
};
let mutation_rate = 2e-4 / 365.;
let genome = SimpleGenome::default();
let genome = SimpleGenome::<64>::default();
let outbreak = simulate_outbreak(genome, &dm, mutation_rate, 100, &mut rng);

assert!(outbreak.is_ok());
Expand Down
17 changes: 14 additions & 3 deletions src/simulate/outbreak.rs
Original file line number Diff line number Diff line change
Expand Up @@ -3,6 +3,8 @@ use crate::genome::Genome;
use crate::{Count, Time};
use std::io;

const FASTA_N_COLS: usize = 70;

/// A simulated outbreak containing a number of cases.
#[derive(Debug)]
pub struct Outbreak<G> {
Expand Down Expand Up @@ -49,20 +51,29 @@ impl<G: Genome> Outbreak<G> {
pub fn write_fasta<W: io::Write>(&self, mut writer: W) -> io::Result<()> {
let sources = self.outbreaks();

let mut sequence = Vec::<u8>::new();
for (i, genome) in self.genome.iter().enumerate() {
writeln!(
writer,
">case{:06} day_infected={} day_reported={} outbreak={} parent={}",
i,
self.history[i].infected,
self.history[i].infected,
self.history[i]
.reported
.map(|x| x.to_string())
.unwrap_or("".to_string()),
sources[i],
self.source[i]
.map(|x| format!("case{:06}", x))
.unwrap_or_else(String::new)
)?;
genome.write_nucleotides(&mut writer)?;
writeln!(writer)?;

genome.write_nucleotides(&mut sequence)?;
for chunk in sequence.chunks(FASTA_N_COLS) {
writer.write_all(chunk)?;
writeln!(writer)?;
}
sequence.clear();
}
Ok(())
}
Expand Down

0 comments on commit 69f6eda

Please sign in to comment.