-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathprepareChrSequences.py
50 lines (35 loc) · 1.07 KB
/
prepareChrSequences.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
##################################
## ##
## prepareChrSequences.py ##
## ##
##################################
#
# Purpose: concatenate the sequence of every chromosome into a single file
#
#
# Inputs:
# - one .fa file for each chromosome
#
#
# Output:
# - one file (all_sequences.txt) with all the sequences, one chromosome per line; the first line of each .fa file (its header) is dropped
#
from time import localtime, strftime, sleep
# Merge the per-chromosome .fa files into a single text file.
#
# For every chromosome listed below, the file "chr<name>.fa" is read from
# seq_dir, its first line is skipped, and every remaining line is written to
# "all_sequences.txt" with trailing whitespace removed and no separator, so
# each chromosome ends up on exactly one output line.
#
# Raises IOError/OSError if the output file cannot be created or if any of the
# expected chromosome files is missing.

# Directory holding the input .fa files; the merged file is written here too.
seq_dir = "./mm10_input/chr_sequences/"
chromosomes = ["1", "2", "3", "4", "5", "6", "7", "8", "9", "10", "11", "12",
               "13", "14", "15", "16", "17", "18", "19", "M", "X", "Y"]

# `with` guarantees both the output file and every input file are closed,
# even when a chromosome file is missing or a write fails part-way through.
with open(seq_dir + "all_sequences.txt", 'w') as out_file:
    for c in chromosomes:
        fasta_name = "chr" + c + ".fa"
        # Progress message: timestamp plus the name without the ".fa" suffix.
        # Single-argument parenthesised print is valid on Python 2 and 3.
        print(strftime("%H:%M:%S", localtime()) + ": " + fasta_name[:-3])
        with open(seq_dir + fasta_name, 'r') as in_file:
            # Drop the first line of the file; the default argument keeps an
            # empty file from raising StopIteration.
            next(in_file, None)
            # Stream line by line instead of loading the whole chromosome
            # into a list with readlines().
            for line in in_file:
                out_file.write(line.rstrip())
        # Terminate this chromosome's single output line.
        out_file.write("\n")

print(strftime("%H:%M:%S", localtime()) + ": Done.")
#######################
## ##
## End of File ##
## ##
#######################