-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathFasta_Parser.py
More file actions
50 lines (36 loc) · 1.36 KB
/
Fasta_Parser.py
File metadata and controls
50 lines (36 loc) · 1.36 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
###@author Feng Ju
###@email fengju@westlake.edu.cn
print 'This script is written for parsing Large Fasta file into small sub-fastas!'
import os
import time, sys
Parameters=raw_input("Enter two parameters: [Fastaname],[NUM](*10000)(number of sequences in each sub-fasta), sepeated by Space: ")
while True:
try:
filename=Parameters.split(' ')[0]
Num=Parameters.split(' ')[1]
num=int(float(Num)*10000)
break
except:
Parameters=raw_input("Enter two parameters: [Fastaname],[NUM](*10000)(number of sequences in each sub-fasta), sepeated by Space: ")
start=time.time() # Timing begins
wrerr = sys.stderr.write
if os.path.exists(filename+'_divided'):
for root, dirs, files in os.walk(filename+'_divided'):
for name in files:
os.remove(os.path.join(root,name))
else:
os.mkdir(filename+'_divided')
j=-1
f=open(filename+'_divided\\'+filename.replace('.fasta','')+'-1.fasta','w')
for line in open(filename,'r'):
if '>' in line:
j+=1
if j%int(num)==0 and j!=0:
f=open(filename+'_divided\\'+filename.replace('.fasta','')+'-'+str(1+j/int(num))+'.fasta','a')
f.write(line)
else:
f.write(line)
f.close()
end=time.time() # Timing ends
wrerr("OK, work finished in %3.2f secs\n" % (end-start))
f.close()