main.py 15.2 KB
Newer Older
Stelios Karozis's avatar
Stelios Karozis committed
1
import os
Stelios Karozis's avatar
Stelios Karozis committed
2
import pandas as pd
Stelios Karozis's avatar
Stelios Karozis committed
3
import tooba_f as tbf
4
import tooba_gmx as tbgmx
Stelios Karozis's avatar
Stelios Karozis committed
5 6 7 8 9 10
###################################################
#NOTICE:    resids of head in each subdomain may differ in tail case
#           keep all atoms of group in the first occurent subdomain
#           in case of tail is the one closest to the head, hence
#           the code is a good approximation 
###################################################
11
SYSTEM_NAME='test'
Stelios Karozis's avatar
Stelios Karozis committed
12
DISCET=[3.5, 3.5, 3.5]
Stelios Karozis's avatar
Stelios Karozis committed
13
NUM_FR=2
14 15
TRAJ=SYSTEM_NAME+'/eq_traj.trr'
GRO=SYSTEM_NAME+'/eq_final.gro'
16
TPR=SYSTEM_NAME+'/eq_run.tpr'
17
#ITP_DIC={'NS':'CER_SOVOVA.itp','FFA':'FFA_CG.itp','CHOL':'CHOL_CG.itp'}
18 19 20 21 22 23
###################################################
# {NAME:[QUEUE OF PROCESSES]}
#
#   NAME: It is user defined. A dictionary must follows with the same name.
#         The dict structure has to be: {res_type:[atom_types]}
# 
24
#         if NAME is COMBINE then it needs part or all the info from aforementioned
25 26
#         groups to execute a process. You cannot use combination as first group.
#
27 28 29 30 31 32 33 34
#   QUEUE OF PROCESSES: surf, vector, tilt, index, density, gmx_ndx, [save, [type], save_name] 
#                                            
#                       surf:                       Determine surface from atoms (ex. Head of lipid)
#                       vector:                     Determine vector that fits atoms (ex. Tail of lipid)
#                       tilt:                       Use surf and vector result to calculate angle (if NAME is COMBINE)
#                       index:                      Creates unique code (md5) for every subdomain to use in data saving process 
#                       density:                    Detrmine density profile of x,y,z and save peaks of directions with the least number 
#                       gmx_ndx:                    Saves one ndx for every subdomain
35
#                       [save, [type], save_name]:  Save result of previous function, type: pkl, json
36 37
#
###################################################
38 39
GROUPS={'ALL':['gmx_ndx','index',['save', ['pkl'],'index'],'density',['save', ['pkl'],'dens']],
        'HD_GROUP':['surf',['save', ['pkl', 'json'],'time_domain_c-normal-cg']],
Stelios Karozis's avatar
Stelios Karozis committed
40
        'TL_GROUP':['vector',['save', ['pkl'],'vec']],
41
        'COMBINE':[['HD_GROUP','surf'],['TL_GROUP','vector'],['COMB','tilt'],['save', ['pkl'],'tilt']]
42
}
43
ALL={'NS':['C6', 'Na', 'P4', 'P3', 'C7','C3', 'C4', 'C5', 'C8', 'C9', 'C10'], 'CHOL':['ROH','R1', 'R2', 'R3', 'R4', 'R5'], 'FFA':['AC','C1', 'C2', 'C3', 'C4']}
Stelios Karozis's avatar
Stelios Karozis committed
44 45
HD_GROUP={'NS':['C6', 'Na', 'P4', 'P3', 'C7'], 'CHOL':['ROH'], 'FFA':['AC']}
TL_GROUP={'NS':['C3', 'C4', 'C5', 'C8', 'C9', 'C10'], 'CHOL':['R1', 'R2', 'R3', 'R4', 'R5'], 'FFA':['C1', 'C2', 'C3', 'C4']}
Stelios Karozis's avatar
Stelios Karozis committed
46
###################################################
Stelios Karozis's avatar
Stelios Karozis committed
47 48 49 50 51 52 53
###################################################
print(' ')
print('================')
print('Starting process')
print('================')
###################################################
###################################################
54
#Read .gro file
Stelios Karozis's avatar
Stelios Karozis committed
55
_,data_num,_,res_num,res_type,atom_type,atom_num,_ = tbf.read_gro(GRO)
Stelios Karozis's avatar
Stelios Karozis committed
56 57
print(' ')
###################################################
58
#--------------------------------------------------
Stelios Karozis's avatar
Stelios Karozis committed
59 60 61 62 63 64 65 66
#Count frames & calculate time of calculations
cnt_fr,time_index=tbf.count_frames(TRAJ,True)
MAX_FR=list(time_index.keys())[-1]
#print(MAX_FR,time_index[MAX_FR])
ST_FR=MAX_FR-NUM_FR
#print(ST_FR,time_index[ST_FR])
###################################################
#--------------------------------------------------
67 68 69 70 71 72 73 74
#Read .itp files
#weights={}
#for MOL in ITP_DIC.keys():
#    weights_tmp = tbf.read_itp(SYSTEM_NAME+'/'+ITP_DIC[MOL])
#    weights[MOL]=weights_tmp
#    print(' ')
#print(weights)
###################################################
75
#--------------------------------------------------
76
if os.path.isfile('./'+SYSTEM_NAME+'/'+SYSTEM_NAME+'_data.pkl'):
Stelios Karozis's avatar
Stelios Karozis committed
77
    pass
Stelios Karozis's avatar
Stelios Karozis committed
78
else:
79 80 81
    #Read .trr file
    data_all=tbf.fr_export(trajfile=TRAJ,num_frames=NUM_FR)
    tbf.topickle(fl=data_all, sv_name='./'+SYSTEM_NAME+'/'+SYSTEM_NAME+'_data')
Stelios Karozis's avatar
Stelios Karozis committed
82
    del data_all
Stelios Karozis's avatar
Stelios Karozis committed
83
###################################################
84 85 86 87
#--------------------------------------------------
#Check save files if exist in order to skip functions
prev=0
sv_index={}
88
for i in GROUPS.keys():
89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115
    for j in GROUPS[i]:
        try:
            sv_index[j]={}
            sv_index[j]['status']='not exist'
            sv_index[j]['name']='None'
        except TypeError:
            sv_index[str(j)]={}
            sv_index[str(j)]['status']='not exist'
            sv_index[str(j)]['name']='None'
        if len(j)==3:
            if j[0]=='save':
                for k in j[1]:
                    if k=='pkl':
                        if os.path.isfile('./'+SYSTEM_NAME+'/'+SYSTEM_NAME+'_'+i+'_'+j[2]+'.pkl'):
                            sv_index[prev]['status']='exist'
                            sv_index[prev]['name']='./'+SYSTEM_NAME+'/'+SYSTEM_NAME+'_'+i+'_'+j[2]+'.pkl'
                        else:
                            sv_index[prev]['status']='not exist'
                    if k=='json':    
                        if os.path.isfile('./'+SYSTEM_NAME+'/'+SYSTEM_NAME+'_'+i+'_'+j[2]+'.pkl'):
                            sv_index[prev]['status']='exist'
                            sv_index[prev]['name']='./'+SYSTEM_NAME+'/'+SYSTEM_NAME+'_'+i+'_'+j[2]+'.pkl'
                        else:
                            sv_index[prev]['status']='not exist'
        prev=str(j)
###################################################
#--------------------------------------------------
Stelios Karozis's avatar
Stelios Karozis committed
116
mrg_data={}
117 118
for i in GROUPS.keys():
#not COMBINE section
119 120
    if i!='COMBINE': 
        if os.path.isfile('./'+SYSTEM_NAME+'/'+SYSTEM_NAME+'_'+i+'_ndx.pkl'):
Stelios Karozis's avatar
Stelios Karozis committed
121
            pass
122 123
        else:
            #Find atom type index in lists created above
124
            group_ndx=tbf.atomid_data(res_num, res_type, atom_type, atom_num, group=locals()[i])
125
            tbf.topickle(fl=group_ndx, sv_name='./'+SYSTEM_NAME+'/'+SYSTEM_NAME+'_'+i+'_ndx')
Stelios Karozis's avatar
Stelios Karozis committed
126
            del group_ndx
127
#--------------------------------------------------
128
        if os.path.isfile('./'+SYSTEM_NAME+'/'+SYSTEM_NAME+'_'+i+'_box.pkl'):
Stelios Karozis's avatar
Stelios Karozis committed
129
            pass            
130
        else:
Stelios Karozis's avatar
Stelios Karozis committed
131 132
            data_all=tbf.frompickle('./'+SYSTEM_NAME+'/'+SYSTEM_NAME+'_data.pkl')
            group_ndx=tbf.frompickle('./'+SYSTEM_NAME+'/'+SYSTEM_NAME+'_'+i+'_ndx.pkl')
133 134 135 136 137 138 139
            #Create subdomains coordinates
            box_p=tbf.domain_decomposition(data=data_all,dx=DISCET[0],dy=DISCET[1],dz=DISCET[2])
            #Assign desired atoms (from above function) to subdomains
            ##result1: {step:{res:{atom_type:{atom_num:(subX,subYsubZ)}}}}
            ##result2: {step:{res:{atom_type:{(subX,subYsubZ):[atom_num]}}}}
            _,box_res=tbf.atom2grid(data_all,box_p, group_ndx)
            tbf.topickle(fl=box_res, sv_name='./'+SYSTEM_NAME+'/'+SYSTEM_NAME+'_'+i+'_box')
Stelios Karozis's avatar
Stelios Karozis committed
140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155
            del data_all
            del group_ndx
            del box_p
            del box_res
###################################################
        if os.path.isfile('./'+SYSTEM_NAME+'/'+SYSTEM_NAME+'_'+i+'_FR'+str(NUM_FR)+'.pkl'):
            pass   
        else:
            #Creates dictionary with coordinates per subdomain for each frame
            data_all=tbf.frompickle('./'+SYSTEM_NAME+'/'+SYSTEM_NAME+'_data.pkl')
            box_res=tbf.frompickle('./'+SYSTEM_NAME+'/'+SYSTEM_NAME+'_'+i+'_box.pkl')
            _,coord_vector=tbf.sub_coord(box=box_res, data=data_all, res_num=res_num)
            tbf.topickle(fl=coord_vector, sv_name='./'+SYSTEM_NAME+'/'+SYSTEM_NAME+'_'+i+'_FR'+str(NUM_FR))
            del data_all
            del box_res
            del coord_vector
156
###################################################
157 158
        for j in GROUPS[i]:
            if len(j) > 1:
159
                if j=='surf' and sv_index[j]['status']=='not exist':
Stelios Karozis's avatar
Stelios Karozis committed
160 161
                    if j not in locals():
                        surf={}
162
                    #Creates dictionary with c, normal per subdomain for each frame
Stelios Karozis's avatar
Stelios Karozis committed
163
                    coord_vector=tbf.frompickle('./'+SYSTEM_NAME+'/'+SYSTEM_NAME+'_'+i+'_FR'+str(NUM_FR)+'.pkl')
164
                    surf[i]=tbf.coord2norm2cg(coord_vector,img=False)
Stelios Karozis's avatar
Stelios Karozis committed
165
                    del coord_vector
166 167
                    sv_data=surf[i]
                elif j=='surf' and sv_index[j]['status']=='exist':
168 169
                    if j not in locals():
                        surf={}
170 171 172 173 174
                    surf[i]=tbf.frompickle(sv_index[j]['name'])
#--------------------------------------------------   
                if j=='vector' and sv_index[j]['status']=='not exist':
                    if j not in locals():
                        vector={}
Stelios Karozis's avatar
Stelios Karozis committed
175
                    coord_vector=tbf.frompickle('./'+SYSTEM_NAME+'/'+SYSTEM_NAME+'_'+i+'_FR'+str(NUM_FR)+'.pkl')
176
                    vector[i]=tbf.coord2vector(coord_vector)
Stelios Karozis's avatar
Stelios Karozis committed
177
                    del coord_vector
178 179 180
                    sv_data=vector[i]
                elif j=='vector' and sv_index[j]['status']=='exist':
                    if j not in locals():
181
                        vector={}
182 183 184
                    vector[i]=tbf.frompickle(sv_index[j]['name'])
#--------------------------------------------------
                if j=='index' and sv_index[j]['status']=='not exist':
185 186
                    uniq_id=tbgmx.ndx_index(SYSTEM_NAME)
                    sv_data=uniq_id
187 188 189 190
                elif j=='index' and sv_index[j]['status']=='exist':
                    uniq_id=tbf.frompickle(sv_index[j]['name'])
#--------------------------------------------------
                if j=='density' and sv_index[j]['status']=='not exist':
Stelios Karozis's avatar
Stelios Karozis committed
191
                    dens_dict={}
192
                    for iidd in uniq_id.keys():
Stelios Karozis's avatar
Stelios Karozis committed
193
                        dens_dict[iidd]={}
Stelios Karozis's avatar
Stelios Karozis committed
194
                        fl='./'+uniq_id[iidd]['system']+'/gmx_ndx/'+uniq_id[iidd]['ndx_file']                  
195 196
                        cnt=-1
                        for mol in locals()[i].keys():
Stelios Karozis's avatar
Stelios Karozis committed
197 198 199
                            ind=tbf.search_pattern(fl,mol)
                            if ind=='not exist':
                                break
200 201
                            cnt=cnt+1
                            for d in ('x','y','z'):
Stelios Karozis's avatar
Stelios Karozis committed
202
                                peaks = tbgmx.density_picks(TRR=TRAJ,TPR=TPR,IND=fl,SLC=400,ST=time_index[ST_FR],EN=-1,normal=d,fld='./'+uniq_id[iidd]['system'],arg=cnt,dist_pk=20)
203 204 205 206 207 208 209
                                if d=='x':
                                    tmp=peaks
                                else:
                                    print(len(tmp),len(peaks))
                                    if len(tmp)<len(peaks):
                                        peaks=tmp
                                    tmp=peaks
Stelios Karozis's avatar
Stelios Karozis committed
210 211 212 213 214
                            dens_nm=mol+'_dens'
                            dens_dict[iidd][dens_nm]=peaks
                        sv_data=dens_dict
                        mrg_data[j]=[dens_dict,[]]
                    del dens_dict
215
                elif j=='density' and sv_index[j]['status']=='exist':
Stelios Karozis's avatar
Stelios Karozis committed
216 217 218
                    dens_dict=tbf.frompickle(sv_index[j]['name'])
                    mrg_data[j]=[dens_dict,[]]
                    del dens_dict
219
#--------------------------------------------------
220
                if j=='gmx_ndx':
Stelios Karozis's avatar
Stelios Karozis committed
221
                    box_res=tbf.frompickle('./'+SYSTEM_NAME+'/'+SYSTEM_NAME+'_'+i+'_box.pkl')
222
                    tbf.togmxndx(box_res, fld='./'+SYSTEM_NAME, sv_name=SYSTEM_NAME+'_'+i)
223 224
#--------------------------------------------------
            # Save module
225 226
            if len(j)==3:
                if j[0]=='save':
227 228 229 230 231 232 233 234 235 236
                    try:
                        sv_data
                    except NameError:
                        pass
                    else:
                        for k in j[1]:
                            if k=='pkl':
                                tbf.topickle(fl=sv_data, sv_name='./'+SYSTEM_NAME+'/'+SYSTEM_NAME+'_'+i+'_'+j[2])
                            if k=='json':    
                                tbf.tojson(fl=sv_data, sv_name='./'+SYSTEM_NAME+'/'+SYSTEM_NAME+'_'+i+'_'+j[2])
Stelios Karozis's avatar
Stelios Karozis committed
237
###################################################
238
#COMBINE section
239 240
    else:
        for j in GROUPS[i]:
241 242 243 244
            #Input to COMBINE property
            if j[0]!='COMB':
                if j[1]=='surf':
                    surf=surf[j[0]]
Stelios Karozis's avatar
Stelios Karozis committed
245
                    #del surf[j[0]]
246 247
                if j[1]=='vector':
                    vector=vector[j[0]]
Stelios Karozis's avatar
Stelios Karozis committed
248
                    #del vector[j[0]]
249 250 251 252
            #Calculate COMBINE property
            if j[0]=='COMB':
                if j[1]=='tilt' and sv_index[str(j)]['status']=='not exist':
                    tilt=tbf.SurfVector_angle(surf,vector)
Stelios Karozis's avatar
Stelios Karozis committed
253 254
                    del surf
                    del vector
255 256 257
                    #Loop over timesteps and keep avgs tilts for each step
                    avg={}
                    for step in tilt.keys():
Stelios Karozis's avatar
Stelios Karozis committed
258
                        ss=[]
259 260 261 262 263 264 265
                        for sub in tilt[step].keys():
                            avgs=tilt[step][sub]['avg/frame']
                            if sub not in ss:
                                ss.append(sub)
                                avg[sub]=avgs
                            else:
                                avg[sub].append(avgs)
Stelios Karozis's avatar
Stelios Karozis committed
266
                    del tilt
267 268 269 270 271 272 273 274 275 276 277 278
                    #Calculate total average 
                    tot_avg={}
                    for sub in avg.keys():
                        for key, value in uniq_id.items():
                            if str(value['domain']).strip() == str(sub).strip():
                                hsh=key
                                break
                        try:
                            tot_avg[hsh]=sum(avg[sub])/len(avg[sub])
                        except TypeError: #in case of one frame
                            tot_avg[hsh]=sum([avg[sub]])/len([avg[sub]])
                    sv_data=tot_avg
Stelios Karozis's avatar
Stelios Karozis committed
279 280
                    mrg_data[j[1]]=[tot_avg,['Tilt[degrees]']]
                    del tot_avg
281 282
                elif j[1]=='tilt' and sv_index[str(j)]['status']=='exist':
                    tot_avg=tbf.frompickle(sv_index[str(j)]['name'])
Stelios Karozis's avatar
Stelios Karozis committed
283 284
                    mrg_data[j[1]]=[tot_avg,['Tilt[degrees]']]
                    del tot_avg
285 286 287 288 289 290 291 292 293 294 295 296 297 298 299
#--------------------------------------------------
            # Save module
            if len(j)==3:
                if j[0]=='save':
                    try:
                        sv_data
                    except NameError:
                        pass
                    else:
                        for k in j[1]:
                            if k=='pkl':
                                tbf.topickle(fl=sv_data, sv_name='./'+SYSTEM_NAME+'/'+SYSTEM_NAME+'_'+i+'_'+j[2])
                            if k=='json':    
                                tbf.tojson(fl=sv_data, sv_name='./'+SYSTEM_NAME+'/'+SYSTEM_NAME+'_'+i+'_'+j[2])             
###################################################
Stelios Karozis's avatar
Stelios Karozis committed
300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316
#Merge data
tbf.topickle(fl=mrg_data, sv_name='./'+SYSTEM_NAME+'/'+SYSTEM_NAME+'_merge')
print(' ')
print('Merging data of:')
print('==============================')
for tp in mrg_data.keys():
    if len(mrg_data[tp][1])!=0:
        df=pd.DataFrame.from_dict(mrg_data[tp][0], orient='index',columns=mrg_data[tp][1])
    else:
        df=pd.DataFrame.from_dict(mrg_data[tp][0], orient='index')
    try:
        data_df=data_df.join(df)
    except:
        data_df=df.copy()
        continue
tbf.topickle(fl=data_df, sv_name='./'+SYSTEM_NAME+'/'+SYSTEM_NAME+'_dataset')
###################################################
317
###################################################