1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
extern crate getopts;
extern crate fasten;
extern crate regex;
extern crate rand;
use std::fs::File;
use std::io::BufReader;
use std::io::BufRead;
use std::env;
use rand::distributions::{IndependentSample, Range};
use fasten::fasten_base_options;
use fasten::logmsg;
fn main(){
let args: Vec<String> = env::args().collect();
let mut opts = fasten_base_options();
opts.optopt("s", "snps", "Number of SNPs (point mutations) to include per read.", "INT");
opts.optflag("m", "mark", "lowercase all reads but uppercase the SNPs (not yet implemented)");
let matches = opts.parse(&args[1..]).expect("ERROR: could not parse parameters");
if matches.opt_present("help") {
println!("Mutates reads. There is no mutation model; only randomness.\n{}", opts.usage(&opts.short_usage(&args[0])));
std::process::exit(0);
}
if matches.opt_present("paired-end") {
logmsg("WARNING: --paired-end is not utilized in this script");
}
let num_snps:u8 = if matches.opt_present("snps") {
matches.opt_str("snps").unwrap()
.parse().expect("--snps needs to be a FLOAT")
} else {
panic!("ERROR: --snps is required")
};
let mark:bool = if matches.opt_present("mark"){
true
} else {
false
};
let nts = vec!['A', 'C', 'G', 'T'];
let my_file = File::open("/dev/stdin").expect("Could not open file");
let my_buffer=BufReader::new(my_file);
let mut buffer_iter = my_buffer.lines();
while let Some(line) = buffer_iter.next() {
let id = line.expect("ERROR reading the ID line");
let seq = buffer_iter.next().expect("ERROR reading a sequence line")
.expect("ERROR reading a sequence line");
buffer_iter.next().expect("ERROR reading a plus line")
.expect("ERROR reading the plus line");
let qual= buffer_iter.next().expect("ERROR reading a qual line")
.expect("ERROR reading a qual line");
let new_seq = mutate(&seq, &nts, num_snps, mark);
println!("{}\n{}\n+\n{}",id,new_seq,qual);
}
}
fn mutate(seq: &str, nts: &Vec<char>, num_snps: u8, mark:bool) -> String {
let mut sequence:Vec<u8> = seq.as_bytes().to_vec();
if mark {
sequence.make_ascii_lowercase();
}
let length = sequence.len();
let between = Range::new(0, length);
let nt_range= Range::new(0, nts.len());
let mut rng = rand::thread_rng();
for _ in 0..num_snps {
let pos = between.ind_sample(&mut rng);
let nt = nts[nt_range.ind_sample(&mut rng)];
sequence[pos] = nt as u8;
}
return String::from_utf8_lossy(&sequence).to_string();
}