forked from jmcole003/SDS_humans
-
Notifications
You must be signed in to change notification settings - Fork 0
/
calc_boot_viability.R
68 lines (56 loc) · 2.15 KB
/
calc_boot_viability.R
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
# Bootstrapping for UKB haplotype data
# SAS viability
# updated - 2/8/24
#Remove scientific notation
#options(scipen = 999)
options(warn=1)
#Argument, libraries, and settings
suppressMessages(library("optparse")) #load opt parser library
suppressMessages(library("dplyr"))
suppressMessages(library("data.table"))
option_list = list(
make_option(c("-f", "--file"), type="character", default=NULL,
help="haplotype counts file", metavar="character"),
make_option(c("-w", "--windowsize"), type="character", default=2,
help="window size [default= %default]", metavar="numeric"),
make_option(c("-b", "--bootreps"), type="character", default=100,
help="bootstrap samples [default= %default]", metavar="numeric"),
make_option(c("-p", "--pxhat"), type="character", default=0.2,
help="assumed minor allele frequency at site x [default= %default]",
metavar="numeric"),
make_option(c("-o", "--output"), type="character", default=NULL,
help="output file name", metavar="character")
);
opt_parser = OptionParser(option_list=option_list);
opt = parse_args(opt_parser);
if (is.null(opt$file)){
print_help(opt_parser)
stop("At least one argument must be supplied (input haplotype file).n",
call.=FALSE)
}
if (is.null(opt$output)){
print_help(opt_parser)
stop("At least one argument must be supplied (output file name).n",
call.=FALSE)
}
### Import functions
source('/scratch/ukb/scripts/ML_functions.R')
#input haplotype counts
haplotype_counts <- fread(opt$file, sep="\t", header = TRUE,
check.names=FALSE)
#Window size
win <- as.numeric(opt$windowsize)
#px_hat
pxhat <- as.numeric(opt$pxhat)
# Bootstrap
boots = vector("list", length = as.numeric(opt$bootreps))
for (i in 1:as.numeric(opt$bootreps)) {
bt_counts <- bootstrap.v(haplotype_counts, pxhat = pxhat)
bt_counts$bootrep <- i
bt_counts[order(bt_counts$Window),] -> bt_counts
boots[[i]] <- bt_counts
}
boots = do.call(rbind, boots)
#output
write.table(boots, paste0(opt$output, ".v.boot"), sep="\t",
row.names = FALSE, quote = FALSE)