Skip to content

Commit

Permalink
Add script to make DCD trajectories for each cluster.
Browse files Browse the repository at this point in the history
In an effort to make IMP trajectories available in a
more or less standard binary trajectory format (other than
our own RMF format) add a script to convert the set of RMF
files (output from PMI's clustering) stored here into
CHARMM/NAMD DCD files. Relates salilab/imp#964.
  • Loading branch information
benmwebb committed May 22, 2017
1 parent 9baacf4 commit ae2b775
Showing 1 changed file with 91 additions and 0 deletions.
91 changes: 91 additions & 0 deletions Rrp6.analysis/kmeans_weight_500_2/to_dcd.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,91 @@
#!/usr/bin/env python

"""This is a simple script to convert an IMP cluster (multiple single-frame
RMF files) into DCD (CHARMM/NAMD) trajectories, with each bead or residue
represented as a single 'atom', in residue number order (the same order
as in the mmCIF file).
We use the updated version of MDTools that's bundled with Chimera, so you
may need to change sys.path accordingly, below.
"""

from __future__ import print_function
import os
import ast
import sys
sys.path.append('/opt/chimera-1.11-1.fc24/share/Trajectory/DCD/MDToolsMarch97/')
import md
import IMP.pmi.output
import IMP.rmf
import RMF

class IMPCluster(object):
def __init__(self, directory):
self.directory = directory

def get_size(self):
"""Get number of models in the cluster"""
fname = os.path.join(self.directory, 'stat.out')
n_models = 0
with open(fname) as fh:
for line in fh:
n_models += 1
return n_models

def get_rmf_file(self, model_num):
"""Get path to RMF file for the given model in the cluster"""
return os.path.join(self.directory, '%d.rmf3' % model_num)


class DCDOutput(object):
"""Dump a series of IMP Hierarchies to a DCD file."""

def __init__(self, fname):
self.fname = fname
self._d = None

def dump(self, mhs):
coords = self._get_coords(mhs)
if self._d is None:
self._init_dcd(len(coords))
assert(len(coords) == len(self._ag.atoms))
for i, coord in enumerate(coords):
# Everything should be non-atomic for now
assert(coord[1] is None)
a = self._ag.atoms[i]
a.x, a.y, a.z = coord[0]
self._d.append()

def _init_dcd(self, n_coords):
self._ag = md.AtomGroup()
for i in range(n_coords):
self._ag.atoms.append(md.Atom())
self._d = md.DCDWrite(self.fname, self._ag)

def _get_coords(self, mhs):
assert(len(mhs) == 1)
o = IMP.pmi.output.Output(atomistic=True)
name = 'dcd-output'
o.dictionary_pdbs[name] = mhs[0]
o._init_dictchain(name, mhs[0])
coords, geometric_center = o.get_particle_infos_for_pdb_writing(name)
return coords


if len(sys.argv) != 3:
print("Usage: %s [cluster directory] [output DCD file]" % sys.argv[0],
file=sys.stderr)
sys.exit(1)

d = DCDOutput(sys.argv[2])
cluster = IMPCluster(sys.argv[1])

cluster_size = cluster.get_size()
for i in range(cluster_size):
m = IMP.Model()
r = RMF.open_rmf_file_read_only(cluster.get_rmf_file(i))
mhs = IMP.rmf.create_hierarchies(r, m)
# Make sure rigid body coordinates are up to date
m.update()
print("Adding coordinates for model %d of %d" % (i + 1, cluster_size))
d.dump(mhs)

0 comments on commit ae2b775

Please sign in to comment.