-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathMapping_genes.R
52 lines (40 loc) · 1.9 KB
/
Mapping_genes.R
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
## Mapping the intersecting SNPs/genes in the EMMAX to the annotated IBC chip
library(Hmisc)
setwd("Z:/Project/Framingham/Data/Phenotype/FHS49K_lifespan&weight")
## load snps/gene lists to be mapped for their SNPs/genes in the annotation of IBC49K chip
lr_e_f = read.csv("LR_emmax_F.csv",as.is=TRUE)
lr_e_m = read.csv("LR_emmax_M.csv",as.is=TRUE)
## load snp-gene mapping table
mapping.ibc = read.csv('IBC_chip_final_49K SNP_list_BroadInst.csv', as.is = TRUE)
# describe(mydata) like describe(mapping) to explore the datasheet
## set up the new snp-gene mapping table
intersect_emmax_gene_1 = lr_e_f
for (i in 5) intersect_emmax_gene_1[, i] = NA
names(intersect_emmax_gene_1)[5] = c('IBC_gene')
### intersect_emmax_gene_1 = lr_e_f
### intersect_emmax_gene_1[, 5] = NA
### names(intersect_emmax_gene_1)[5] = c('IBC_gene')
intersect_emmax_gene_2 = lr_e_m
for (i in 5) intersect_emmax_gene_2[, i] = NA
names(intersect_emmax_gene_2)[5] = c('IBC_gene')
### intersect_emmax_gene_2 = lr_e_m
### intersect_emmax_gene_2[, 5] = NA
### names(intersect_emmax_gene_2)[5] = c('IBC_gene')
## looking for the corresponding gene for each SNP
for (i in 1L:nrow(intersect_emmax_gene_1)) {
print(i)
for (j in 1L:nrow(mapping.ibc)) {
if (intersect_emmax_gene_1$rs_num[i] %in% mapping.ibc$SNP_ID[j])
intersect_emmax_gene_1[i, 'IBC_gene'] = paste(na.omit(c(intersect_emmax_gene_1[i, 'IBC_gene'], mapping.ibc$RefSeq_hg18_Gene[j])), collapse = ',')
}
}
for (i in 1L:nrow(intersect_emmax_gene_2)) {
print(i)
for (j in 1L:nrow(mapping.ibc)) {
if (intersect_emmax_gene_2$rs_num[i] %in% mapping.ibc$SNP_ID[j])
intersect_emmax_gene_2[i, 'IBC_gene'] = paste(na.omit(c(intersect_emmax_gene_2[i, 'IBC_gene'], mapping.ibc$RefSeq_hg18_Gene[j])), collapse = ',')
}
}
## write candidate snps in csv format
write.csv(intersect_emmax_gene_1, file = 'LR_Emmax_F_ibc.csv')
write.csv(intersect_emmax_gene_2, file = 'LR_Emmax_M_ibc.csv')