-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathChromosomeDistributionAB.py
114 lines (81 loc) · 2.41 KB
/
ChromosomeDistributionAB.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
#from matplotlib import *
#from pylab import *
import numpy
radius=17.2
interval=numpy.linspace(0,radius+2,100)
chr_arrayAA=numpy.zeros((46,len(interval)),dtype=numpy.float)
chr_arrayBB=numpy.zeros((46,len(interval)),dtype=numpy.float)
f=open('./../GM1.dat')
Atype=[]
Btype=[]
for line in f:
l=line.split()
if int(l[1])>=6:
Atype.append(int(l[0]))
Atype.append(int(l[0])+3043)
if int(l[1])==1:
Btype.append(int(l[0]))
Btype.append(int(l[0])+3043)
startPos=4001
endPos=10001+1
noOfFrame=0
a=[249,243,199,191,182,171,160,146,139,134,136,134,115,107,102,91,84,81,59,65,47,51,157]
size=a+a
csize=numpy.cumsum(size)
atoms=sum(size)
print "number of atoms",atoms
chromosome=numpy.zeros((atoms+1,3),dtype=numpy.float)
ABtype=numpy.zeros((atoms+1,1),dtype=numpy.int)
for filen in range(startPos,endPos,1):
noOfFrame+=1
name='my/file'+str(filen)+'.dat'
f=open(name)
cont=f.readlines()
print filen, "Time", cont[1][0:-1]
for i in range(5,len(cont)): ###8 check this line
l=cont[i].split()
if len(l)==6:
chromosome[int(l[0])]=[float(l[3]),float(l[4]),float(l[5])]
if int(l[0]) in Atype:
ABtype[int(l[0])]=1
start=1
for i in range(1,47):
for j in range(start,1+csize[i-1]):
dist=numpy.linalg.norm(chromosome[j])
for k in range(1,len(interval)):
if(dist>=interval[k-1])&(dist<interval[k]):
if ABtype[j]==1:
chr_arrayAA[i-1][k-1]+=1
else:
chr_arrayBB[i-1][k-1]+=1
start=1+csize[i-1]
binsize=interval[1]-interval[0]
xvec=[]
for i in range(len(interval)):
xvec.append(interval[i]/radius)
print "Number of frame", noOfFrame
for j in range(46):
for i in range(len(interval)):
chr_arrayAA[j][i]=chr_arrayAA[j][i]/float(noOfFrame)
chr_arrayBB[j][i]=chr_arrayBB[j][i]/float(noOfFrame)
for j in range(46):
sumAA=0.0
sumBB=0.0
for i in range(len(interval)):
sumAA+=(binsize*chr_arrayAA[j][i])
sumBB+=(binsize*chr_arrayBB[j][i])
for i in range(len(interval)):
chr_arrayAA[j][i]=radius*chr_arrayAA[j][i]/sumAA
chr_arrayBB[j][i]=radius*chr_arrayBB[j][i]/sumBB
fAA=open('chromosome_distributionAA.dat','w')
for j in range(len(interval)):
fAA.write(str(j+1)+'\t'+str(xvec[j])+'\t')
for i in range(46):
fAA.write(str(chr_arrayAA[i][j])+'\t')
fAA.write('\n')
fBB=open('chromosome_distributionBB.dat','w')
for j in range(len(interval)):
fBB.write(str(j+1)+'\t'+str(xvec[j])+'\t')
for i in range(46):
fBB.write(str(chr_arrayBB[i][j])+'\t')
fBB.write('\n')