from prody import *
from numpy import *
from matplotlib.pyplot import *
%matplotlib inline
# Session-wide ProDy settings, applied one at a time (each call logs its own
# confirmation line).
# NOTE(review): auto_secondary=True is presumably what makes parsePDB assign
# secondary structures on load (the parse logs report it) — confirm in the docs.
confProDy(auto_show=False)
confProDy(auto_secondary=True)

@> ProDy is configured: auto_show=False
@> ProDy is configured: auto_secondary=True


# parsePDB?


# Parse PDB entry 1p38 into an AtomGroup named `p38`, which the rest of the
# notebook works on. The bare `p38` on the last line only displays its repr.
# NOTE(review): compressed=False presumably requests the plain .pdb file
# rather than .pdb.gz — confirm against the parsePDB documentation.
p38 = parsePDB('1p38', compressed=False)
p38

@> PDB file is found in working directory (1p38.pdb).
@> 2962 atoms and 1 coordinate set(s) were parsed in 0.07s.
@> Secondary structures were assigned to 188 residues.

<AtomGroup: 1p38 (2962 atoms)>


showProtein(p38);
legend();


coords = p38.getCoords()


coords.shape

(2962, 3)


showContactMap(p38.ca);

@> Kirchhoff was built in 0.03s.


p38[10]

<Atom: CA from 1p38 (index 10)>


p38[10].getCoords()

array([24.179,  4.807, 21.907])


# Draw the protein, then mark the atom at index 10 with a large blue dot
# ('bo', markersize=20) on the current axes.
showProtein(p38);
# Grab the current axes right after showProtein so the marker lands on the
# same figure. Assumes these are the 3D axes showProtein drew on — TODO confirm.
ax3d = gca()
x, y, z = p38[10].getCoords()
# Coordinates are wrapped in one-element lists because plot() takes sequences.
ax3d.plot([x], [y], [z], 'bo', markersize=20);


p38['A']

<Chain: A from 1p38 (480 residues, 2962 atoms)>


p38['A'].getSequence()

'ERPTFYRQELNKTIWEVPERYQNLSPVGSGAYGSVCAAFDTKTGHRVAVKKLSRPFQSIIHAKRTYRELRLLKHMKHENVIGLLDVFTPARSLEEFNDVYLVTHLMGADLNNIVKCQKLTDDHVQFLIYQILRGLKYIHSADIIHRDLKPSNLAVNEDCELKILDFGLARHTDDEMTGYVATRWYRAPEIMLNWMHYNQTVDIWSVGCIMAELLTGRTLFPGTDHIDQLKLILRLVGTPGAELLKKISSESARNYIQSLAQMPKMNFANVFIGANPLAVDLLEKMLVLDSDKRITAAQALAHAYFAQYHDPDDEPVADPYDQSFESRDLLIDEWKSLTYDEVISFVPPPLD'


p38[10].getResnum()

5


p38['A', 5]

<Residue: ARG 5 from Chain A from 1p38 (11 atoms)>


p38['A', 5].getNames()

array(['N', 'CA', 'C', 'O', 'CB', 'CG', 'CD', 'NE', 'CZ', 'NH1', 'NH2'],
      dtype='<U6')


hv = p38.getHierView()


hv['A', 5]

<Residue: ARG 5 from Chain A from 1p38 (11 atoms)>


betas = p38.getBetas()
betas.shape

(2962,)


p38.ca

<Selection: 'ca' from 1p38 (351 atoms)>


betas = p38.ca.getBetas()
betas.shape

(351,)


# Plain matplotlib line plot of the B-factors in `betas`. No x values are
# passed, so the x axis is the position in the array, hence "Residue index".
plot(betas);
xlabel('Residue index');
ylabel('B-factor');


# Same B-factors, plotted through ProDy with the matching C-alpha atoms
# supplied alongside the data.
# NOTE(review): passing `atoms` presumably makes the x axis use residue
# numbers instead of array positions (as the label implies) — confirm.
showAtomicLines(betas, atoms=p38.ca);
xlabel('Residue number');
ylabel('B-factor');


p38.ca.getSecstrs()

array(['C', 'C', 'C', 'C', 'E', 'E', 'E', 'E', 'E', 'E', 'C', 'C', 'E',
       'E', 'E', 'E', 'E', 'E', 'C', 'C', 'C', 'C', 'C', 'C', 'E', 'E',
       'E', 'E', 'C', 'C', 'C', 'C', 'E', 'E', 'E', 'E', 'E', 'E', 'E',
       'C', 'C', 'C', 'C', 'C', 'C', 'E', 'E', 'E', 'E', 'E', 'E', 'E',
       'C', 'C', 'C', 'C', 'C', 'C', 'H', 'H', 'H', 'H', 'H', 'H', 'H',
       'H', 'H', 'H', 'H', 'H', 'H', 'H', 'H', 'H', 'C', 'C', 'C', 'C',
       'C', 'C', 'C', 'C', 'C', 'C', 'E', 'E', 'E', 'C', 'C', 'C', 'C',
       'C', 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'E', 'E', 'E', 'E', 'E',
       'C', 'C', 'C', 'C', 'C', 'H', 'H', 'H', 'H', 'H', 'H', 'H', 'C',
       'C', 'C', 'C', 'H', 'H', 'H', 'H', 'H', 'H', 'H', 'H', 'H', 'H',
       'H', 'H', 'H', 'H', 'H', 'H', 'H', 'H', 'H', 'H', 'H', 'C', 'C',
       'C', 'C', 'C', 'C', 'C', 'C', 'G', 'G', 'G', 'E', 'E', 'E', 'C',
       'C', 'C', 'C', 'C', 'E', 'E', 'E', 'C', 'C', 'C', 'C', 'C', 'C',
       'C', 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'H', 'H',
       'H', 'H', 'H', 'C', 'C', 'H', 'H', 'H', 'H', 'C', 'C', 'C', 'C',
       'C', 'C', 'C', 'G', 'G', 'G', 'G', 'G', 'G', 'G', 'G', 'G', 'G',
       'G', 'G', 'G', 'G', 'G', 'G', 'G', 'C', 'C', 'C', 'C', 'C', 'C',
       'C', 'C', 'C', 'H', 'H', 'H', 'H', 'H', 'H', 'H', 'H', 'H', 'H',
       'H', 'H', 'C', 'C', 'C', 'C', 'H', 'H', 'H', 'H', 'H', 'H', 'C',
       'C', 'C', 'H', 'H', 'H', 'H', 'H', 'H', 'H', 'H', 'H', 'C', 'C',
       'C', 'C', 'C', 'C', 'C', 'C', 'G', 'G', 'G', 'C', 'C', 'C', 'C',
       'C', 'C', 'H', 'H', 'H', 'H', 'H', 'H', 'H', 'H', 'H', 'H', 'C',
       'C', 'C', 'C', 'G', 'G', 'G', 'C', 'C', 'C', 'H', 'H', 'H', 'H',
       'H', 'C', 'C', 'G', 'G', 'G', 'C', 'C', 'C', 'C', 'C', 'G', 'G',
       'G', 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'G', 'G', 'G',
       'G', 'C', 'C', 'C', 'C', 'H', 'H', 'H', 'H', 'H', 'H', 'H', 'H',
       'H', 'H', 'H', 'H', 'H', 'C', 'C', 'C', 'C', 'C', 'C', 'C', 'C'],
      dtype='<U1')


''.join(p38.ca.getSecstrs())

'CCCCEEEEEECCEEEEEECCCCCCEEEECCCCEEEEEEECCCCCCEEEEEEECCCCCCHHHHHHHHHHHHHHHHCCCCCCCCCCEEECCCCCCCCCCCCEEEEECCCCCHHHHHHHCCCCHHHHHHHHHHHHHHHHHHHHHCCCCCCCCGGGEEECCCCCEEECCCCCCCCCCCCCCCCCHHHHHCCHHHHCCCCCCCGGGGGGGGGGGGGGGGGCCCCCCCCCHHHHHHHHHHHHCCCCHHHHHHCCCHHHHHHHHHCCCCCCCCGGGCCCCCCHHHHHHHHHHCCCCGGGCCCHHHHHCCGGGCCCCCGGGCCCCCCCCCGGGGCCCCHHHHHHHHHHHHHCCCCCCCC'

p38

<AtomGroup: 1p38 (2962 atoms)>


calcPhi(p38['A', 10])

-115.5351427673999


# Collect the backbone dihedral angles (phi, psi) of every residue in chain A
# together with one colour per residue. The three lists stay index-aligned:
# Phi[i], Psi[i] and c[i] always describe the same residue.
chain = p38['A']
Phi = []; Psi = []; c = []

# Colour for each secondary-structure code; any other code is drawn in grey.
secstr_colors = {'H': 'red', 'G': 'darkred', 'E': 'blue'}

for res in chain.iterResidues():
    try:
        phi = calcPhi(res)
        psi = calcPsi(res)
    except ValueError:
        # Residues for which a dihedral cannot be computed (e.g. chain termini
        # lacking a neighbour) are skipped. Only ValueError is caught so that
        # KeyboardInterrupt and genuine programming errors are no longer
        # silently swallowed, as they were with a bare `except:`.
        # NOTE(review): assumes calcPhi/calcPsi signal these cases with
        # ValueError — confirm against the installed ProDy version.
        continue

    Phi.append(phi)
    Psi.append(psi)

    # Glycine always gets its own colour, regardless of secondary structure.
    if res.getResname() == 'GLY':
        c.append('black')
    else:
        # The first atom's secondary-structure code stands in for the residue.
        secstr = res.getSecstrs()[0]
        c.append(secstr_colors.get(secstr, 'grey'))


# Ramachandran-style scatter plot: one point per residue at (phi, psi),
# coloured by the per-residue colour list `c` (small markers, s=10).
scatter(Phi, Psi, c=c, s=10);
xlabel('Phi (degree)');
ylabel('Psi (degree)');


ca = p38.select('calpha')
ca

<Selection: 'calpha' from 1p38 (351 atoms)>


bb = p38.select('backbone')
bb

<Selection: 'backbone' from 1p38 (1404 atoms)>


chainA_ca = parsePDB('1p38', chain='A', subset='ca')

@> PDB file is found in working directory (1p38.pdb.gz).
@> 351 atoms and 1 coordinate set(s) were parsed in 0.02s.
@> Secondary structures were assigned to 188 residues.


chA = p38.select('calpha and chain A')
chA

<Selection: 'calpha and chain A' from 1p38 (351 atoms)>


res = p38.ca.select('chain A and resnum 10')
res.getResnums()

array([10])


res = p38.ca.select('chain A and resnum 10 11 12')
res.getResnums()

array([10, 11, 12])


head = p38.ca.select('resnum < 50')
head.numAtoms()

46


fragment = p38.ca.select('resnum 50 to 100')


subbetas = sliceAtomicData(betas, atoms=p38.ca, select=fragment)


showAtomicLines(subbetas, atoms=fragment);
xlabel('Residue number');
ylabel('B factor');


# Draw the full C-alpha B-factor profile and the `fragment` subset in the same
# call sequence with overlay=True.
# NOTE(review): overlay=True presumably draws both curves on one set of axes
# so the fragment is highlighted on top of the full profile — confirm.
showAtomicLines(betas, atoms=p38.ca, overlay=True);
showAtomicLines(subbetas, atoms=fragment, overlay=True);
xlabel('Residue number');
ylabel('B factor');


args = p38.ca.select('resname ARG')
args

<Selection: '(resname ARG) and (ca)' from 1p38 (19 atoms)>


# Pull out the B-factors that belong to the arginine C-alpha selection `args`
# from the full C-alpha array `betas`.
argbetas = sliceAtomicData(betas, atoms=p38.ca, select=args)
# Plot the full profile, then the arginine values with the 'r*' line spec
# (red star markers) in overlay mode.
showAtomicLines(betas, atoms=p38.ca, overlay=True);
showAtomicLines(argbetas, atoms=args, linespec='r*', overlay=True);
xlabel('Residue number');
ylabel('B factor');


bound = parsePDB('1zz2', compressed=False)

@> PDB file is found in working directory (1zz2.pdb).
@> 2872 atoms and 1 coordinate set(s) were parsed in 0.06s.
@> Secondary structures were assigned to 220 residues.


# Match chains of the two structures (`p38` and `bound`, parsed from 1zz2).
# `results` is indexable; the first entry is displayed here and is a 4-tuple:
# two AtomMaps followed by two floats (unpacked in the next cell as
# sequence identity and overlap).
results = matchChains(p38, bound)
results[0]

@> Checking AtomGroup 1p38: 1 chains are identified
@> Checking AtomGroup 1zz2: 1 chains are identified
@> Trying to match chains based on residue numbers and names:
@>   Comparing Chain A from 1p38 (len=351) and Chain A from 1zz2 (len=337):
@> 	Match: 337 residues match with 99% sequence identity and 96% overlap.

(<AtomMap: Chain A from 1p38 -> Chain A from 1zz2 from 1p38 (337 atoms)>,
 <AtomMap: Chain A from 1zz2 -> Chain A from 1p38 from 1zz2 (337 atoms)>,
 99.40652818991099,
 96.01139601139602)


# Unpack the first match: the AtomMap taken from 1p38, the AtomMap taken from
# 1zz2, and the two percentages reported by matchChains.
apo_chA, bnd_chA, seqid, overlap = results[0]


apo_chA

<AtomMap: Chain A from 1p38 -> Chain A from 1zz2 from 1p38 (337 atoms)>


bnd_chA

<AtomMap: Chain A from 1zz2 -> Chain A from 1p38 from 1zz2 (337 atoms)>


seqid

99.40652818991099


overlap

96.01139601139602


calcRMSD(bnd_chA, apo_chA)

72.93023086946586


showProtein(bnd_chA);
showProtein(apo_chA);
legend();


# Superpose bnd_chA onto apo_chA. superpose returns two values; the first is
# rebound to `bnd_chA` and the second is kept as `transformation`.
# NOTE(review): ProDy warns that both arguments are AtomMaps and suggests
# weights=...getFlags("mapped") when dummy atoms are present — check whether
# that applies to this match.
bnd_chA, transformation = superpose(bnd_chA, apo_chA)
# Recompute the RMSD for comparison with the value from before superposition.
calcRMSD(bnd_chA, apo_chA)

@> WARNING mobile is an AtomMap instance, consider assign weights=mobile.getFlags("mapped") if there are dummy atoms in mobile
@> WARNING target is an AtomMap instance, consider assign weights=target.getFlags("mapped") if there are dummy atoms in target

1.862801490869549


showProtein(bnd_chA);
showProtein(apo_chA);
legend();


showProtein(p38);
showProtein(bound);
legend();


# With py3Dmol imported, the same showProtein call returns a py3Dmol view
# object instead of drawing with matplotlib.
# NOTE(review): presumably ProDy selects the py3Dmol backend once the module
# has been imported in the session — confirm in the showProtein docs.
import py3Dmol
showProtein(p38)

<py3Dmol.view at 0x123b1b790>


# Save the bound-structure atoms (bnd_chA, rebound after superposition) to a
# PDB file in the working directory; the call returns the file name.
writePDB('bound_aligned.pdb', bnd_chA)

'bound_aligned.pdb'

ProDy Basics

Loading PDB files and visualization

Retrieving data from an AtomGroup

Selection

Compare and align structures

Advanced Visualization