Mutate Residue PDB

RCSB PDB is a member of the wwPDB and is funded by the National Science Foundation (DBI-1832184), the National Institutes of Health, and the US Department of Energy (DE-SC0019749). A C library to mutate PDB residues: the source code for this command is written in C and exposes a Tcl interface, so chances are that you can adapt it to your needs. Keep in mind, though, that after you mutate a residue you may need to do a short equilibration run.

Permalink

Join GitHub today

GitHub is home to over 36 million developers working together to host and review code, manage projects, and build software together.

Find file Copy path

53aa41aApr 10, 2019

2 contributors

import os

import sys

import math

import subprocess

from itertools import chain

import argparse

import parmed

# Prefer the C-accelerated StringIO on Python 2; fall back to io.StringIO
# (the only option on Python 3).
try:
    from cStringIO import StringIO
except ImportError:
    from io import StringIO

from .leap_runner import _make_leap_template

from .utils import easy_call

import logging

logger = logging.getLogger('pdb4amber_log')

logger.setLevel(logging.DEBUG)

# True when running under Python 3.
PY3 = sys.version_info[0] == 3

# Type(s) accepted wherever a "string" (file name, mask, ...) is expected.
if PY3:
    string_types = str
else:
    string_types = basestring  # noqa: F821 -- only defined on Python 2

#TODO: include in ParmEd?

from .residue import (

RESPROT,

AMBER_SUPPORTED_RESNAMES,

HEAVY_ATOM_DICT, )

from .utils import tempfolder, amberbin

__version__='1.6.dev'

class AmberPDBFixer(object):
    """Base class (?) for handling pdb4amber (try to mimic original code).

    Most methods modify ``self.parm`` in place and return ``self`` so that
    calls can be chained.

    Parameters
    ----------
    parm : str or parmed.Structure or None, default None
        A string is passed to ``parmed.load_file``; ``None`` creates an empty
        ``parmed.Structure``; any other object is stored as-is.
    """

    def __init__(self, parm=None):
        # TODO: make a copy?
        # Why not now? parm[:] will not correctly assign TER residue
        # self.parm = parm[:]
        if isinstance(parm, string_types):
            self.parm = parmed.load_file(parm)
        elif parm is None:
            self.parm = parmed.Structure()
        else:
            self.parm = parm

    def mutate(self, mask_list):
        """Rename residues and strip their side-chain atoms.

        Every listed residue is renamed, then all of its atoms except
        ``C``, ``CA``, ``N`` and ``O`` are stripped.

        TODO : same syntax as pdbfixer (openmm)?

        Parameters
        ----------
        mask_list: List[Tuple[int, str]]
            Pairs of (0-based residue index, new residue name), e.g.
            [(1, 'ARG'),]

        Returns
        -------
        self

        Notes
        -----
        Should also use `add_hydrogen` and `add_missing_atoms`
        """
        idxs = []
        for (idx, resname) in mask_list:
            self.parm.residues[idx].name = resname
            # Amber masks are 1-based
            idxs.append(str(idx + 1))
        if not idxs:
            # Nothing to mutate; an empty residue list would produce the
            # malformed mask ':&!@C,CA,N,O'.
            return self
        excluded_mask = ':' + ','.join(idxs) + '&!@C,CA,N,O'
        self.parm.strip(excluded_mask)
        return self

    def pack(self, mol, n_copies, ig=8888, grid_spacing=0.2):
        """Add n_copies of mol to AmberPDBFixer.

        Runs the external ``AddToBox`` program in a temporary folder and
        replaces ``self.parm`` with the structure loaded from its output.

        Parameters
        ----------
        mol : parmed.Structure
        n_copies : number of `mol`
        ig : int
            random seed (passed as ``-IG``)
        grid_spacing : float
            passed as ``-G``

        Returns
        -------
        self

        Requires
        --------
        AddToBox program
        """
        add_to_box_exe = amberbin('AddToBox') or 'AddToBox'
        input_pdb = 'input.pdb'
        mol_pdb = 'mol.pdb'
        out_pdb = 'out.pdb'

        with tempfolder():
            mol.save(mol_pdb, overwrite=True)
            self.parm.save(input_pdb, overwrite=True)
            command = [
                add_to_box_exe, '-c', input_pdb, '-a', mol_pdb, '-na',
                str(n_copies), '-IG', str(ig), '-G', str(grid_spacing), '-o',
                out_pdb
            ]
            easy_call(command)
            self.parm = parmed.load_file(out_pdb)
        return self

    def assign_histidine(self):
        """Assign correct name for Histidine based on the atom name.

        Residues named HIS/HID/HIE/HIP are renamed according to which of the
        hydrogens ``HD1`` and ``HE2`` they contain: both -> HIP, only HD1 ->
        HID, only HE2 -> HIE.  Residues with neither keep their name.

        Returns
        -------
        self : with updated `parm`
        """
        amber_his_names = set(['HID', 'HIE', 'HIP'])
        possible_names = set([
            'HIS',
        ]) | amber_his_names

        for residue in self.parm.residues:
            if residue.name in possible_names:
                # names of the hydrogen atoms of this residue
                atom_name_set = sorted(
                    set(atom.name for atom in residue.atoms
                        if atom.atomic_number == 1))
                if set(['HD1', 'HE2']).issubset(atom_name_set):
                    residue.name = 'HIP'
                elif 'HD1' in atom_name_set:
                    residue.name = 'HID'
                elif 'HE2' in atom_name_set:
                    residue.name = 'HIE'
        return self

    def strip(self, mask):
        """Strip the atoms selected by `mask` from `parm`; return self."""
        self.parm.strip(mask)
        return self

    def find_missing_heavy_atoms(self, heavy_atom_dict=HEAVY_ATOM_DICT):
        """Find residues that have fewer heavy atoms than expected.

        Parameters
        ----------
        heavy_atom_dict : dict
            Maps residue name to the expected number of heavy atoms.
            Residues whose name is not a key are ignored.

        Returns
        -------
        residue_collection : List[[residue, n_missing]]
        """
        residue_collection = []
        for residue in self.parm.residues:
            if residue.name in heavy_atom_dict:
                n_heavy_atoms = len(
                    set(atom.name for atom in residue.atoms
                        if atom.atomic_number != 1))
                n_missing = heavy_atom_dict[residue.name] - n_heavy_atoms
                if n_missing > 0:
                    residue_collection.append([residue, n_missing])
        return residue_collection

    def add_missing_atoms(self):
        """Run ``tleap`` (loadpdb/savepdb) and reload `parm` from its output.

        Returns
        -------
        self
        """
        in_pdb = 'in.pdb'
        out_pdb = 'out.pdb'

        with tempfolder():
            self.write_pdb(in_pdb)
            with open('leap.in', 'w') as fh:
                fh.write('source leaprc.protein.ff14SB\n')
                fh.write('source leaprc.DNA.bsc1\n')
                fh.write('source leaprc.RNA.OL3\n')
                fh.write('x = loadpdb {}\n'.format(in_pdb))
                fh.write('savepdb x {}\n'.format(out_pdb))
                fh.write('quit')
            easy_call('tleap -f leap.in', shell=True)
            self.parm = parmed.load_file(out_pdb)
        return self

    def constph(self):
        """Update AS4, GL4, HIP for constph.

        Renames ASP -> AS4, GLU -> GL4 and HIS -> HIP.

        Returns
        -------
        self : with updated `parm`
        """
        for residue in self.parm.residues:
            if residue.name == 'ASP':
                residue.name = 'AS4'
            elif residue.name == 'GLU':
                residue.name = 'GL4'
            elif residue.name == 'HIS':
                residue.name = 'HIP'
        return self

    def find_non_protein_residues(self):
        """Return the set of residue names that are not in RESPROT."""
        return set(res.name for res in self.parm.residues
                   if res.name not in RESPROT)

    def find_gaps(self):
        """Find chain breaks by looking at the C-N peptide bond distance.

        A gap is reported when the distance between the C atom of one
        residue and the N atom of the next exceeds 2.0.  Gaps are also
        written to the module logger.

        Returns
        -------
        gaplist : List[Tuple[float, str, int, str, int]]
            (distance, C residue name, C residue 0-based index,
            N residue name, N residue 0-based index)
        """
        # TODO: doc
        # report original resnum?
        CA_atoms = []
        C_atoms = []
        N_atoms = []
        gaplist = []
        parm = self.parm

        #  N.B.: following only finds gaps in protein chains!
        # H.N: Assume that residue has all 3 atoms: CA, C, and N
        respro_nocap = set(RESPROT) - {'ACE', 'NME'}
        for i, atom in enumerate(parm.atoms):
            # TODO: if using 'CH3', this will be failed with
            # ACE ALA ALA ALA NME system
            # if atom.name in ['CA', 'CH3'] and atom.residue.name in RESPROT:
            if atom.name in [
                    'CA',
            ] and atom.residue.name in respro_nocap:
                CA_atoms.append(i)
            if atom.name == 'C' and atom.residue.name in respro_nocap:
                C_atoms.append(i)
            if atom.name == 'N' and atom.residue.name in respro_nocap:
                N_atoms.append(i)

        nca = len(CA_atoms)
        for i in range(nca - 1):
            is_ter = parm.atoms[CA_atoms[i]].residue.ter
            if is_ter:
                continue
            # Changed here to look at the C-N peptide bond distance:
            C_atom = parm.atoms[C_atoms[i]]
            N_atom = parm.atoms[N_atoms[i + 1]]

            dx = float(C_atom.xx) - float(N_atom.xx)
            dy = float(C_atom.xy) - float(N_atom.xy)
            dz = float(C_atom.xz) - float(N_atom.xz)
            gap = math.sqrt(dx * dx + dy * dy + dz * dz)

            if gap > 2.0:
                gaprecord = (gap, C_atom.residue.name, C_atom.residue.idx,
                             N_atom.residue.name, N_atom.residue.idx)
                gaplist.append(gaprecord)

        if gaplist:
            logger.info('\n---------- Gaps (Renumbered Residues!)')
            cformat = 'gap of %lf A between %s %d and %s %d'
            for (d, resname0, resid0, resname1, resid1) in gaplist:
                # convert to 1-based
                logger.info(cformat % (d, resname0, resid0 + 1, resname1,
                                       resid1 + 1))
        return gaplist

    def find_disulfide(self):
        """Find cys-cys pairs whose SG atoms are bonded.

        Only residues named CYS, CYX or CYM are inspected.

        Returns
        -------
        cys_cys_resid : List[Tuple[int, int]]
            sorted pairs of 0-based residue indices
        cys_cys_atomidx : List[Tuple[int, int]]
            sorted pairs of 0-based atom indices of the bonded SG atoms
        """
        residues = [
            res for res in self.parm.residues
            if res.name in ['CYS', 'CYX', 'CYM']
        ]

        cys_cys_resid_set = set()
        cys_cys_atomidx_set = set()
        for residue in residues:
            for atom in residue.atoms:
                if 'SG' in atom.name:
                    for partner in atom.bond_partners:
                        if (partner.residue.name.startswith('CY') and
                                partner.name.startswith('SG')):
                            # use tuple for hashing
                            cys_cys_resid_set.add(
                                tuple(
                                    sorted((atom.residue.idx,
                                            partner.residue.idx))))
                            cys_cys_atomidx_set.add(
                                tuple(sorted((atom.idx, partner.idx))))
        return sorted(cys_cys_resid_set), sorted(cys_cys_atomidx_set)

    def rename_cys_to_cyx(self, cys_cys_set):
        """Rename CYS to CYX if having S-S bond.

        Parameters
        ----------
        cys_cys_set : iterable of (int, int)
            pairs of 0-based residue indices
        """
        for index in chain.from_iterable(cys_cys_set):
            residue = self.parm.residues[index]
            residue.name = 'CYX'

    def find_non_standard_resnames(self):
        """Return the set of residue names not supported by Amber.

        Names are truncated to their first three characters before being
        compared with AMBER_SUPPORTED_RESNAMES.
        """
        ns_names = set()
        for residue in self.parm.residues:
            rname = residue.name[:3]
            if rname.strip() not in AMBER_SUPPORTED_RESNAMES:
                ns_names.add(rname)
        return ns_names

    def add_hydrogen(self, no_reduce_db=False):
        """Use reduce program to add hydrogen.

        The current structure is piped to ``reduce`` as PDB text; stderr is
        saved to ``reduce_info.log`` and ``self.parm`` is replaced by the
        structure parsed from stdout.

        Parameters
        ----------
        no_reduce_db : bool, default False
            If True, an empty ``./dummydb`` file is created and passed to
            reduce with ``-DB``; the file is removed afterwards.

        Returns
        -------
        self

        Requires
        --------
        reduce
        """

        def touch(fname, times=None):
            with open(fname, 'a'):
                os.utime(fname, times)

        dummy_db = './dummydb'
        # Created before the ``try`` so that ``finally`` can always close it.
        fileobj = StringIO()
        try:
            if no_reduce_db:
                touch(dummy_db)
            self.write_pdb(fileobj)
            fileobj.seek(0)

            reduce_exe = os.path.join(
                os.getenv('AMBERHOME', ''), 'bin', 'reduce')
            if not os.path.exists(reduce_exe):
                # fall back to whatever is on PATH
                reduce_exe = 'reduce'

            if no_reduce_db:
                # NOTE(review): '-DB ./dummydb' is passed as ONE argv element;
                # confirm that reduce parses it as intended.
                process = subprocess.Popen(
                    [
                        reduce_exe, '-BUILD', '-NUC', '-NOFLIP',
                        '-DB ./dummydb', '-'
                    ],
                    stdin=subprocess.PIPE,
                    stdout=subprocess.PIPE,
                    stderr=subprocess.PIPE)
            else:
                process = subprocess.Popen(
                    [reduce_exe, '-BUILD', '-NUC', '-NOFLIP', '-'],
                    stdin=subprocess.PIPE,
                    stdout=subprocess.PIPE,
                    stderr=subprocess.PIPE)
            out, err = process.communicate(str.encode(fileobj.read()))
            out = out.decode()
            err = err.decode()
            if process.wait():
                logger.error('REDUCE returned non-zero exit status: '
                             'See reduce_info.log for more details')

            # print out the reduce log even if it worked
            with open('reduce_info.log', 'w') as fh:
                fh.write(err)
            pdbh = StringIO(out)
            # not using load_file since it does not read StringIO
            self.parm = parmed.read_PDB(pdbh)
        finally:
            fileobj.close()
            if no_reduce_db and os.path.exists(dummy_db):
                os.unlink(dummy_db)
        return self

    def visualize(self):
        """Return the result of ``self.parm.visualize()``."""
        return self.parm.visualize()

    def write_pdb(self, filename):
        """Write `parm` in PDB format.

        Parameters
        ----------
        filename : str or file object
        """
        self.parm.write_pdb(filename)

    def _write_renum(self, basename):
        """Write original and renumbered residue index.

        Output goes to ``<basename>_renum.txt``, one line per residue:
        name, original number, name, 1-based index.
        """
        with open(basename + '_renum.txt', 'w') as fh:
            for residue in self.parm.residues:
                fh.write('%3s %5s    %3s %5s\n' %
                         (residue.name, residue.number, residue.name,
                          residue.idx + 1))

    def _write_pdb_to_stringio(self,
                               cys_cys_atomidx_set=None,
                               disulfide_conect=True,
                               noter=False,
                               **kwargs):
        """Write `parm` as PDB text into a new StringIO and return it.

        Parameters
        ----------
        cys_cys_atomidx_set : iterable of (int, int) or None
            0-based atom index pairs; ``None`` is treated as empty.
        disulfide_conect : bool, default True
            If True, the last line of the PDB text is replaced by one CONECT
            record per pair followed by ``END``.
        noter : bool, default False
            If True, lines starting with ``TER`` are dropped.
        **kwargs
            forwarded to ``self.parm.write_pdb``

        Returns
        -------
        StringIO, positioned at the start
        """
        stringio_file = StringIO()
        stringio_file_out = StringIO()
        self.parm.write_pdb(stringio_file, **kwargs)
        stringio_file.seek(0)
        lines = stringio_file.readlines()

        # TODO: update ParmEd?
        if disulfide_conect:
            conect_record = [
                'CONECT%5d%5d\n' % (idx0 + 1, idx1 + 1)
                for (idx0, idx1) in (cys_cys_atomidx_set or ())
            ]
            conect_str = ''.join(conect_record)
            lines[-1] = conect_str + 'END\n'

        if noter:
            lines = [line for line in lines if not line.startswith('TER')]

        stringio_file_out.writelines(lines)
        stringio_file_out.seek(0)
        return stringio_file_out

    def remove_water(self):
        """Strip all residues named in ``parmed.residue.WATER_NAMES``.

        Returns
        -------
        self
        """
        # TODO : add AMBER water names (TP3, ...)
        water_mask = ':' + ','.join(parmed.residue.WATER_NAMES)
        self.parm.strip(water_mask)
        return self

    def _summary(self):
        """Log the chains and alternate locations found in `parm`.

        Returns
        -------
        sumdict : dict
            ``{'has_altlocs': bool}``
        """
        sumdict = dict(has_altlocs=False)

        alt_residues = set()
        chains = set()
        for residue in self.parm.residues:
            chains.add(residue.chain)
            for atom in residue.atoms:
                if atom.other_locations:
                    alt_residues.add(residue)

        # chain
        logger.info('\n----------Chains')
        logger.info('The following (original) chains have been found:')
        for chain_name in sorted(chains):
            logger.info(chain_name)

        # altlocs
        logger.info('\n---------- Alternate Locations (Original Residues!))')
        logger.info('\nThe following residues had alternate locations:')
        if alt_residues:
            sumdict['has_altlocs'] = True
            # NOTE(review): relies on residue objects being orderable
            for residue in sorted(alt_residues):
                logger.info('{}_{}'.format(residue.name, residue.number))
        else:
            logger.info('None')
        return sumdict

def run(
        arg_pdbout,
        arg_pdbin,
        arg_nohyd=False,
        arg_dry=False,
        arg_prot=False,
        arg_amber_compatible_residues=False,
        arg_strip_atom_mask=None,
        arg_mutate_string=None,
        arg_constph=False,
        arg_mostpop=False,
        arg_reduce=False,
        arg_no_reduce_db=False,
        arg_model=0,
        arg_add_missing_atoms=False,
        arg_elbow=False,
        arg_logfile='pdb4amber.log',
        arg_keep_altlocs=False,
        arg_leap_template=False,
        arg_conect=True,
        arg_noter=False, ):
    """Run the whole pdb4amber clean-up pipeline on one structure.

    Parameters
    ----------
    arg_pdbout : str
        Output file name, or 'stdout'/'stderr' to print the PDB text.
        Its base name is also used for the side files ``*_renum.txt``,
        ``*_nonprot.pdb``, ``*_sslink`` and ``*_water.pdb``.
    arg_pdbin : str, file object or parmed.Structure
        Input; the string 'stdin' reads from standard input.
    arg_nohyd : bool
        Strip all hydrogen atoms.
    arg_dry : bool
        Strip waters and save them to ``<base>_water.pdb``.
    arg_prot : bool
        Keep only residues in RESPROT.
    arg_amber_compatible_residues : bool
        Keep only residues in AMBER_SUPPORTED_RESNAMES.
    arg_strip_atom_mask : str or None
        Extra atom mask to strip.
    arg_mutate_string : str or None
        Mutations such as '3-ALA,4-GLU' (1-based residue numbers; ';' is
        accepted as a separator too).
    arg_constph : bool
        Rename ASP/GLU/HIS for constant pH instead of assigning histidines.
    arg_mostpop : bool
        Keep the highest-occupancy alternate location instead of the first.
    arg_reduce : bool
        Add hydrogens with reduce.
    arg_no_reduce_db : bool
        Forwarded to ``AmberPDBFixer.add_hydrogen``.
    arg_model : int
        0-based model index to write; negative keeps all models.
    arg_add_missing_atoms : bool
        Use tleap to add missing atoms.
    arg_elbow : bool
        Currently unused.
    arg_logfile : str or file object
        Log destination.
    arg_keep_altlocs : bool
        Keep alternate locations.
    arg_leap_template : bool
        Write ``leap.template.in``.
    arg_conect : bool
        Write CONECT records for disulfide bonds.
    arg_noter : bool
        Do not write TER records.

    Returns
    -------
    ns_names, gaplist, sslist
        Non-standard residue names, gap records from ``find_gaps`` and
        disulfide residue-index pairs from ``find_disulfide``.

    Raises
    ------
    ValueError
        If `arg_logfile` is neither a string nor a writable object.
    RuntimeError
        If input and output names are identical.
    """
    # always reset handlers to avoid duplication if run method is called more
    # than once
    logger.handlers = []
    if isinstance(arg_logfile, string_types):
        logfile_handler = logging.FileHandler(arg_logfile)
    elif hasattr(arg_logfile, 'write'):
        logfile_handler = logging.StreamHandler(arg_logfile)
    else:
        raise ValueError(
            'wrong arg_logfile: must be either string or file object')
    logger.addHandler(logfile_handler)

    name = arg_pdbin if not hasattr(arg_pdbin,
                                    '__name__') else arg_pdbin.__name__
    logger.info('\n')
    logger.info('Summary of pdb4amber for: %s' % name)
    logger.info('')

    if arg_pdbin == arg_pdbout:
        raise RuntimeError(
            'The input and output file names cannot be the same!\n')

    base_filename, extension = os.path.splitext(arg_pdbout)

    if arg_pdbin == 'stdin':
        if PY3:
            pdbin = StringIO(sys.stdin.read())
        else:
            pdbin = sys.stdin
    else:
        pdbin = arg_pdbin

    if isinstance(pdbin, parmed.Structure):
        parm = pdbin
    elif hasattr(pdbin, 'read'):
        # StringIO (e.g: read from pipe)
        # need to use read_PDB
        parm = parmed.read_PDB(pdbin)
    else:
        try:
            parm = parmed.load_file(pdbin)
        except (parmed.exceptions.FormatNotFound, IndexError):
            sys.stderr.write('Warning: input file may not be a PDB file!\n')
            sys.stderr.write(' trying to process it as one anyway.\n')
            # go back to read_PDB
            parm = parmed.read_PDB(pdbin)

    pdbfixer = AmberPDBFixer(parm)
    pdbfixer._write_renum(base_filename)

    if arg_reduce:
        pdbfixer.add_hydrogen(no_reduce_db=arg_no_reduce_db)

    sumdict = pdbfixer._summary()

    # remove hydrogens if option -y is used:
    if arg_nohyd:
        pdbfixer.parm.strip('@/H')

    # find non-standard Amber residues:
    ns_names = pdbfixer.find_non_standard_resnames()
    logger.info('-----------Non-standard-resnames')
    logger.info(', '.join(ns_names))

    ns_mask = ':' + ','.join(ns_names)
    ns_mask_filename = base_filename + '_nonprot.pdb'
    if ns_mask != ':':
        pdbfixer.parm[ns_mask].save(ns_mask_filename, overwrite=True)
    else:
        # no non-standard residue: still create an (empty) file
        with open(ns_mask_filename, 'w') as fh:
            fh.write('')

    # if arg_elbow:
    #     ns_names = find_non_standard_resnames_elbow(parm)

    # keep only protein:
    if arg_prot:
        pdbfixer.parm.strip('!:' + ','.join(RESPROT))

    if arg_amber_compatible_residues:
        pdbfixer.parm.strip('!:' + ','.join(AMBER_SUPPORTED_RESNAMES))

    # strip atoms with given mask
    if arg_strip_atom_mask is not None:
        pdbfixer.parm.strip(arg_strip_atom_mask)

    # remove water if -d option used:
    if arg_dry:
        water_mask = ':' + ','.join(parmed.residue.WATER_NAMES)
        water_parm = pdbfixer.parm[water_mask]
        pdbfixer.remove_water()
        water_parm.save('{}_water.pdb'.format(base_filename), overwrite=True)

    # find histidines that might have to be changed:
    if arg_constph:
        pdbfixer.constph()
    else:
        pdbfixer.assign_histidine()

    # find possible S-S in the final protein:
    sslist, cys_cys_atomidx_set = pdbfixer.find_disulfide()
    pdbfixer.rename_cys_to_cyx(sslist)
    with open(base_filename + '_sslink', 'w') as fh:
        for (idx0, idx1) in sslist:
            # 1-based residue numbers, one pair per line
            fh.write('{} {}\n'.format(idx0 + 1, idx1 + 1))

    # find possible gaps:
    gaplist = pdbfixer.find_gaps()

    mask_str_list = []
    if arg_mutate_string is not None:
        # e.g: arg_mutate_str = '3-ALA,4-GLU'
        for mask_str in arg_mutate_string.replace(';', ',').split(','):
            index, resname = mask_str.split('-')
            # user input is 1-based; mutate() expects 0-based indices
            mask_str_list.append([int(index.strip()) - 1, resname.strip()])
        pdbfixer.mutate(mask_str_list)

        # mutation will remove all hydrogens
        # add back if using reduce
        if arg_reduce:
            pdbfixer.add_hydrogen(no_reduce_db=arg_no_reduce_db)

    # count heavy atoms:
    missing_atom_residues = pdbfixer.find_missing_heavy_atoms()
    logger.info('\n---------- Mising heavy atom(s)\n')
    if missing_atom_residues:
        for (residue, n_missing) in missing_atom_residues:
            # Logger.warn is a deprecated alias of Logger.warning
            logger.warning('{}_{} misses {} heavy atom(s)'.format(
                residue.name, residue.idx + 1, n_missing))
    else:
        logger.info('None')

    if arg_add_missing_atoms:
        pdbfixer.add_missing_atoms()

    # make final output to new PDB file
    if arg_model >= 0:
        final_coordinates = pdbfixer.parm.get_coordinates()[arg_model]
        write_kwargs = dict(coordinates=final_coordinates)
    else:
        # keep all models
        write_kwargs = dict()
    # so CONECT record can work properly
    write_kwargs['increase_tercount'] = False

    if not arg_keep_altlocs:
        if sumdict['has_altlocs']:
            logger.info('The alternate coordinates have been discarded.')
            # Add the altlocs policy to the existing kwargs; rebinding
            # write_kwargs here would silently drop the selected model
            # coordinates and increase_tercount=False set above.
            if arg_mostpop:
                logger.info(
                    'Only the highest occupancy for each atom was kept.')
                write_kwargs['altlocs'] = 'occupancy'
            else:
                logger.info(
                    'Only the first occurrence for each atom was kept.')
                write_kwargs['altlocs'] = 'first'
        # remove altlocs label
        for atom in pdbfixer.parm.atoms:
            atom.altloc = ''
            for oatom in atom.other_locations.values():
                oatom.altloc = ''

    if arg_pdbout in ['stdout', 'stderr'] or arg_pdbout.endswith('.pdb'):
        output = pdbfixer._write_pdb_to_stringio(
            cys_cys_atomidx_set=cys_cys_atomidx_set,
            disulfide_conect=arg_conect,
            noter=arg_noter,
            **write_kwargs)
        output.seek(0)
        if arg_pdbout in ['stdout', 'stderr']:
            pdb_out_filename = 'stdout.pdb'
            print(output.read())
        else:
            pdb_out_filename = arg_pdbout
            with open(arg_pdbout, 'w') as fh:
                fh.write(output.read())
    else:
        # mol2 does not accept altloc keyword
        pdb_out_filename = arg_pdbout
        pdbfixer.parm.save(pdb_out_filename, overwrite=True)

    if arg_leap_template:
        with open('leap.template.in', 'w') as fh:
            if arg_prot:
                final_ns_names = []
            else:
                final_ns_names = ns_names
            # NOTE(review): this passes the structure loaded at the top of
            # the function, not pdbfixer.parm -- confirm that is intended.
            content = _make_leap_template(
                parm,
                final_ns_names,
                gaplist,
                sslist,
                input_pdb=pdb_out_filename,
                prmtop='prmtop',
                rst7='rst7')
            fh.write(content)
    return ns_names, gaplist, sslist

def main(argv=None):
    """Command-line entry point: parse `argv` and call ``run``.

    Parameters
    ----------
    argv : list of str or None
        Arguments to parse; ``None`` lets argparse read ``sys.argv[1:]``.
    """
    parser = argparse.ArgumentParser()
    parser.add_argument(
        'input',
        nargs='?',
        help='PDB input file (default: stdin)', )
    parser.add_argument(
        '-i',
        '--in',
        metavar='FILE',
        dest='pdbin',
        help='PDB input file (default: stdin)',
        default='stdin')
    parser.add_argument(
        '-o',
        '--out',
        metavar='FILE',
        dest='pdbout',
        help='PDB output file (default: stdout)',
        default='stdout')
    parser.add_argument(
        '-y',
        '--nohyd',
        action='store_true',
        dest='nohyd',
        help='remove all hydrogen atoms (default: no)')
    parser.add_argument(
        '-d',
        '--dry',
        action='store_true',
        dest='dry',
        help='remove all water molecules (default: no)')
    parser.add_argument(
        '-s',
        '--strip',
        dest='strip_atom_mask',
        default=None,
        help='Strip given atom mask, (default: no)')
    parser.add_argument(
        '-m',
        '--mutate',
        dest='mutation_string',
        default=None,
        help='Mutate residue')
    parser.add_argument(
        '-p',
        '--prot',
        action='store_true',
        dest='prot',
        help='keep only protein residues (default: no)')
    parser.add_argument(
        '-a',
        '--amber-compatible-residues',
        action='store_true',
        dest='amber_compatible_residues',
        help='keep only Amber-compatible residues (default: no)')
    parser.add_argument(
        '--constantph',
        action='store_true',
        dest='constantph',
        help='rename GLU,ASP,HIS for constant pH simulation')
    parser.add_argument(
        '--most-populous',
        action='store_true',
        dest='mostpop',
        help="keep most populous alt. conf. (default is to keep 'A')")
    parser.add_argument(
        '--keep-altlocs',
        action='store_true',
        dest='keep_altlocs',
        help='Keep alternative conformations')
    parser.add_argument(
        '--reduce',
        action='store_true',
        dest='reduce',
        help='Run Reduce first to add hydrogens.  (default: no)')
    parser.add_argument(
        '--no-reduce-db',
        action='store_true',
        dest='no_reduce_db',
        help='If reduce is on, skip using it for hetatoms. '
        '(default: usual reduce behavior for hetatoms)')
    parser.add_argument(
        '--pdbid',
        action='store_true',
        dest='pdbid',
        help='fetch structure with given pdbid, '
        'should combined with -i option.\n'
        'Subjected to change')
    parser.add_argument(
        '--add-missing-atoms',
        action='store_true',
        dest='add_missing_atoms',
        help='Use tleap to add missing atoms. (EXPERIMENTAL OPTION)')
    parser.add_argument(
        '--model',
        type=int,
        dest='model',
        default=1,
        help='Model to use from a multi-model pdb file (integer).  '
        '(default: use 1st model). '
        'Use a negative number to keep all models')
    parser.add_argument(
        '-l',
        '--logfile',
        metavar='FILE',
        dest='logfile',
        help='log filename',
        default='stderr')
    parser.add_argument(
        '-v', '--version', action='store_true', dest='version',
        help='version')
    parser.add_argument(
        '--leap-template',
        action='store_true',
        dest='leap_template',
        help='write a leap template for easy adaption\n(EXPERIMENTAL)')
    parser.add_argument(
        '--no-conect',
        action='store_true',
        dest='no_conect',
        help='Not write S-S conect record')
    parser.add_argument(
        '--noter', action='store_true', dest='noter', help='Not writing TER')

    opt = parser.parse_args(argv)

    # pdbin : {str, file object, parmed.Structure}
    if opt.version:
        # the version is printed and processing then continues
        print(__version__)

    # the positional argument takes precedence over -i/--in
    if opt.input is not None:
        pdbin = opt.input
    else:
        pdbin = opt.pdbin

    if opt.pdbid:
        pdbin = parmed.download_PDB(pdbin)

    if opt.pdbin == 'stdin' and opt.input is None:
        # nothing was given and nothing is piped in: show help and leave
        if os.isatty(sys.stdin.fileno()):
            parser.print_help()
            sys.exit(0)

    if opt.logfile == 'stderr':
        logfile = sys.stderr
    elif opt.logfile == 'stdout':
        logfile = sys.stdout
    else:
        logfile = opt.logfile

    run(
        arg_pdbout=opt.pdbout,
        arg_pdbin=pdbin,
        arg_nohyd=opt.nohyd,
        arg_dry=opt.dry,
        arg_strip_atom_mask=opt.strip_atom_mask,
        arg_mutate_string=opt.mutation_string,
        arg_prot=opt.prot,
        arg_amber_compatible_residues=opt.amber_compatible_residues,
        arg_constph=opt.constantph,
        arg_mostpop=opt.mostpop,
        arg_reduce=opt.reduce,
        arg_no_reduce_db=opt.no_reduce_db,
        # the command line is 1-based, run() expects a 0-based model index
        arg_model=opt.model - 1,
        arg_keep_altlocs=opt.keep_altlocs,
        arg_add_missing_atoms=opt.add_missing_atoms,
        arg_logfile=logfile,
        arg_leap_template=opt.leap_template,
        arg_conect=not opt.no_conect,
        arg_noter=opt.noter)


if __name__ == '__main__':
    main()

Copy lines
Copy permalink

Permalink

Join GitHub today

GitHub is home to over 36 million developers working together to host and review code, manage projects, and build software together.

Find file Copy path

Cannot retrieve contributors at this time

import sys

import os

from modeller import*

from modeller.optimizers import molecular_dynamics, conjugate_gradients

from modeller.automodel import autosched

# mutate_model.py
#
# Usage:   python mutate_model.py modelname respos resname chain pdb_filename out_name > logfile
#
# Example: python mutate_model.py 1t29 1699 LEU A 1t29.pdb 1t29_mutant.pdb > 1t29.log
#
# Creates a single in silico point mutation to sidechain type and at residue
# position input by the user, in the structure read from pdb_filename; the
# mutated model is written to out_name.
# The conformation of the mutant sidechain is optimized by conjugate gradient
# and refined using some MD.
#
# Note: if the model has no chain identifier, specify "" for the chain argument.

def optimize(atmsel, sched):
    """Optimize `atmsel`: schedule steps, then MD, then conjugate gradients.

    Parameters
    ----------
    atmsel : selection of atoms to optimize
    sched : iterable of schedule steps, each providing ``optimize``
    """
    # conjugate gradient
    for step in sched:
        step.optimize(atmsel, max_iterations=200, min_atom_shift=0.001)
    # md
    refine(atmsel)
    # final conjugate-gradient pass after the MD refinement
    cg = conjugate_gradients()
    cg.optimize(atmsel, max_iterations=200, min_atom_shift=0.001)

#molecular dynamics

def refine(atmsel):
    """Refine `atmsel` with molecular dynamics.

    Two temperature ramps are run: 150 -> 1000 (200 iterations,
    ``equilibrate=20``) followed by 1000 -> 300 (200 iterations,
    ``equilibrate=600``).  Velocities are initialized only for the very
    first MD run.
    """
    # at T=1000, max_atom_shift for 4fs is cca 0.15 A.
    md = molecular_dynamics(cap_atom_shift=0.39, md_time_step=4.0,
                            md_return='FINAL')
    init_vel = True
    for (its, equil, temps) in ((200, 20, (150.0, 250.0, 400.0, 700.0, 1000.0)),
                                (200, 600,
                                 (1000.0, 800.0, 600.0, 500.0, 400.0, 300.0))):
        for temp in temps:
            md.optimize(atmsel, init_velocities=init_vel, temperature=temp,
                        max_iterations=its, equilibrate=equil)
            # later runs continue from the current velocities
            init_vel = False

#use homologs and dihedral library for dihedral angle restraints

def make_restraints(mdl1, aln):
    """Rebuild the restraints of `mdl1` from scratch.

    Clears ``mdl1.restraints`` and then creates stereo, phi-psi and
    omega/chi1..chi4 dihedral restraints for a selection of the whole model
    (use homologs and dihedral library for dihedral angle restraints).

    Parameters
    ----------
    mdl1 : model whose restraints are replaced
    aln : alignment passed to every ``restraints.make`` call
    """
    rsr = mdl1.restraints
    rsr.clear()
    s = selection(mdl1)
    for typ in ('stereo', 'phi-psi_binormal'):
        rsr.make(s, restraint_type=typ, aln=aln, spline_on_site=True)
    for typ in ('omega', 'chi1', 'chi2', 'chi3', 'chi4'):
        rsr.make(s, restraint_type=typ + '_dihedral', spline_range=4.0,
                 spline_dx=0.3, spline_min_points=5, aln=aln,
                 spline_on_site=True)

# Command-line arguments (six, all required, in this order):
#   modelname     alignment code; also used to build the temporary file name
#   respos        residue key looked up in the chain's residues
#   restyp        residue type to mutate to
#   chain         chain identifier
#   pdb_filename  PDB file that is read
#   out_name      file the mutated model is written to
if len(sys.argv) != 7:
    # fail with a readable message instead of a tuple-unpacking ValueError
    sys.exit('Usage: python mutate_model.py modelname respos resname chain '
             'pdb_filename out_name')
modelname, respos, restyp, chain, pdb_filename, out_name = sys.argv[1:]

# Temporary file used for the write/read round trip further down.
tmp_filename = modelname + restyp + respos + chain + '.tmp'

log.verbose()

# Set a different value for rand_seed to get a different final model
env = environ(rand_seed=-49837)

env.io.hetatm = True
# soft sphere potential
env.edat.dynamic_sphere = False
# lennard-jones potential (more accurate)
env.edat.dynamic_lennard = True
env.edat.contact_shell = 4.0
env.edat.update_dynamic = 0.39

# Read customized topology file with phosphoserines (or standard one)
env.libs.topology.read(file='$(LIB)/top_heav.lib')

# Read customized CHARMM parameter library with phosphoserines (or standard one)
env.libs.parameters.read(file='$(LIB)/par.lib')

# Read the original PDB file and copy its sequence to the alignment array:
mdl1 = model(env, file=pdb_filename)
ali = alignment(env)
ali.append_model(mdl1, atom_files=pdb_filename, align_codes=modelname)

# set up the mutate residue selection segment
s = selection(mdl1.chains[chain].residues[respos])

# perform the mutate residue operation
s.mutate(residue_type=restyp)
# get two copies of the sequence.  A modeller trick to get things set up
ali.append_model(mdl1, align_codes=modelname)

# Generate molecular topology for mutant
mdl1.clear_topology()
mdl1.generate_topology(ali[-1])

# Transfer all the coordinates you can from the template native structure
# to the mutant (this works even if the order of atoms in the native PDB
# file is not standard):
# here we are generating the model by reading the template coordinates
mdl1.transfer_xyz(ali)

# Build the remaining unknown coordinates
mdl1.build(initialize_xyz=False, build_method='INTERNAL_COORDINATES')

# yes model2 is the same file as model1.  It's a modeller trick.
mdl2 = model(env, file=pdb_filename)

# required to do a transfer_res_numb
# ali.append_model(mdl2, atom_files=modelname, align_codes=modelname)
# transfers from "model 2" to "model 1"
mdl1.res_num_from(mdl2, ali)

# It is usually necessary to write the mutated sequence out and read it in
# before proceeding, because not all sequence related information about MODEL
# is changed by this command (e.g., internal coordinates, charges, and atom
# types and radii are not updated).
mdl1.write(file=tmp_filename)
try:
    mdl1.read(file=tmp_filename)

    # set up restraints before computing energy
    # we do this a second time because the model has been written out and
    # read in, clearing the previously set restraints
    make_restraints(mdl1, ali)

    # a non-bonded pair has to have at least as many selected atoms
    mdl1.env.edat.nonbonded_sel_atoms = 1

    sched = autosched.loop.make_for_model(mdl1)

    # only optimize the selected residue (in first pass, just atoms in
    # selected residue, in second pass, include nonbonded neighboring atoms)
    # set up the mutate residue selection segment
    s = selection(mdl1.chains[chain].residues[respos])

    mdl1.restraints.unpick_all()
    mdl1.restraints.pick(s)

    s.energy()

    s.randomize_xyz(deviation=4.0)

    mdl1.env.edat.nonbonded_sel_atoms = 2
    optimize(s, sched)

    # feels environment (energy computed on pairs that have at least one
    # member in the selected)
    mdl1.env.edat.nonbonded_sel_atoms = 1
    optimize(s, sched)

    s.energy()

    # give a proper name
    mdl1.write(file=out_name)
finally:
    # delete the temporary file, even when the optimization failed
    os.remove(tmp_filename)

Copy lines
Copy permalink