from prody import *
# checkUpdates() # no longer works!

import prody as pd
from prody import parsePDB

# Usage example: parse the structure with PDB identifier '1ubi' and keep the
# result as `ubi` (reused by the visualization and file-handling cells below).
ubi = parsePDB('1ubi')

# Bare expression: in a notebook/REPL this echoes the object's repr.
ubi

# Atom count of the parsed structure.
ubi.numAtoms()

# NOTE(review): presumably the radius of gyration of all atoms in `ubi`
# (going by the function name) — confirm against the ProDy docs.
calcGyradius(ubi)

# Visualization: enable inline matplotlib figures when running under
# IPython/Jupyter. The `%matplotlib inline` line magic is not valid Python
# syntax outside IPython, so the equivalent API call is used instead.
try:
    get_ipython().run_line_magic('matplotlib', 'inline')
except NameError:
    # get_ipython() only exists inside an IPython session; under plain Python
    # there is no inline backend to enable, so this step is skipped.
    pass
showProtein(ubi)

# Better visualization: import py3Dmol, then draw the same structure again.
# NOTE(review): presumably showProtein switches to a py3Dmol viewer once the
# module has been imported — confirm against the ProDy docs.
import py3Dmol
showProtein(ubi)

# File handling: save the atoms with saveAtoms; no filename is passed here.
saveAtoms(ubi)

# Write the same structure to 'ubi.pdb'.
writePDB('ubi.pdb', ubi)

# The return value of writePDB is handed straight to parsePDB.
# NOTE(review): presumably writePDB returns the path it wrote, so this reads
# the freshly written file back in — confirm.
parsePDB(writePDB('ubi.pdb', ubi))

# Structures and AtomGroups: parse PDB identifier '1vrt' into `ag`, which the
# following cells keep reusing.
ag = parsePDB('1vrt')

# Echo the class of the object parsePDB returned.
type(ag)

# Atom count of the group.
ag.numAtoms()

# Number of coordinate sets held by the group.
ag.numCoordsets()

# Getters: fetch the atom names and inspect them.
names = ag.getNames()

# Echo the whole collection of names.
names

# Number of names returned.
len(names)

# First entry only.
print(names[0])

# Beta values as parsed, before they are overwritten below.
ag.getBetas()

# Setters: build a list holding one 0 per atom and assign it as the betas.
zeros = [0] * len(ag) # same as ag.numAtoms()
ag.setBetas(zeros)

# Read the betas again to see the effect of setBetas.
ag.getBetas()

# Atom instances: integer indexing on the group; `a0` is the item at index 0.
a0 = ag[0]
print(a0)

# Name of that single atom.
a0.getName()

a0.getBeta() # we had just set it to zero

# Subset of atoms: slice the group with a step of 2.
eoa = ag[::2] # eoa: every other atom
print(eoa)

# Compare the size of the slice with the size of the full group.
print(len(eoa))
print(len(ag))

# Getters are called on the subset the same way as on the full group.
eoa.getNames()

# Hierarchical views: chain and residue counts of the whole group.
ag.numChains()

ag.numResidues()

# Draw the full structure.
showProtein(ag)

# Iterations: print one summary line per chain, giving the chain's string
# form and its residue count.
for ch in ag.iterChains():
    chain_label = str(ch)
    residue_count = ch.numResidues()
    print('%s - %d residues' % (chain_label, residue_count))

# Second pass: print each chain followed by only its first residue (if it
# has any), then an ellipsis line standing in for the remaining residues.
for ch in ag.iterChains():
    print(ch)
    first_res = next(iter(ch), None)
    if first_res is not None:
        print(' |-%s' % first_res)
    print('...')

# Indexing: use a chain identifier as the key, then show the result and its
# class.
chA = ag['A']
print(chA)
type(chA)

# Use a (chain identifier, number) pair as the key.
# NOTE(review): presumably 10 is a residue number rather than a positional
# index — confirm against the ProDy docs.
chA_res10 = ag['A', 10]
print(chA_res10)
type(chA_res10)

# Atom names within the object returned by the pair lookup.
chA_res10.getNames()

# Atom count of that same object.
chA_res10.numAtoms()

# Atom Selections: select atoms with a selection string, then report the
# selection and its size.
sel = ag.select('protein and name CA')
print(sel)
print('# of atoms: %d' % sel.numAtoms())
# Collapse the names to a set to list the distinct atom names selected.
set(sel.getNames())

# Chained equality comparison of three selections: 'ca', 'calpha' and the
# explicit 'protein and name CA' form.
ag.select('ca') == ag.select('calpha') == ag.select('protein and name CA')

# Selecting by distance: parse '3erk', then select with a 'within 5 of (...)'
# string whose reference group is '(hetero and not water)'.
kinase = parsePDB('3erk')
bindingsite = kinase.select('within 5 of (hetero and not water)')
print('# of atoms: %d' % bindingsite.numAtoms())
# Distinct residue names present in that selection.
print(set(bindingsite.getResnames()))

# Same query written with 'exwithin' instead of 'within'.
# NOTE(review): presumably 'exwithin' leaves out the reference atoms
# themselves — confirm against the ProDy selection docs.
noligand = kinase.select('exwithin 5 of (hetero and not water)')
print('# of atoms: %d' % noligand.numAtoms())
print(set(noligand.getResnames()))

# Keyword arguments: the selection string mentions a name ('origin') whose
# value is passed to select() as a keyword argument of the same name.
# `np` imported here is also used by later cells.
import numpy as np
origin = np.zeros(3)
print(origin)
sel = ag.select('within 10 of origin', origin=origin)
sel

# First five entries of calcDistance between the selection and `origin`.
calcDistance(sel, origin)[:5]

# Same pattern with a different keyword name; its value comes from
# calcCenter(ag).
ag.select('within 5 of center',center = calcCenter(ag))

# Dot selection shorthand: attribute access in place of a select() call.
ag.calpha

# NOTE(review): presumably equivalent to select('name CA and resname ALA'),
# with underscores standing in for spaces — confirm.
ag.name_CA_and_resname_ALA

# Coordinate Sets: rebind `ubi` to the structure with PDB identifier '2k39'.
ubi = parsePDB('2k39')

# Number of coordinate sets in this structure.
ubi.numCoordsets()

# Current ACS index (presumably "active coordinate set" — confirm).
ubi.getACSIndex()

# Coordinates: take the coordinate array and average it over axis 0.
coords = ubi.getCoords()
coords.mean(axis=0)

# Switch the ACS index to 115 and recompute the same mean for comparison.
ubi.setACSIndex(115)
ubi.getCoords().mean(axis=0)

# Take the `calpha` shorthand selection and read its ACS index.
ubi_ca = ubi.calpha
ubi_ca.getACSIndex()

# Set the selection's ACS index to 0, then print the selection's index next
# to the parent group's so the two can be compared.
ubi_ca.setACSIndex(0)
print(ubi_ca.getACSIndex())
print(ubi.getACSIndex())

# Copying atoms: copy() is called on the whole group ...
ag.copy()

# ... and on a selection.
ca = ag.select('ca')
ca.copy()

# AtomGroup addition: copy `ag`, move the copy by [50, 50, 50], change the
# chain identifiers of its chains 'A' and 'B' to 'C' and 'D', then add the
# original and the copy together and draw the result.
# Relies on `np` imported in an earlier cell.
ag_copy = ag.copy()
moveAtoms(ag_copy, by=np.array([50, 50, 50]))
ag_copy['A'].setChid('C')
ag_copy['B'].setChid('D')
ag_new = ag + ag_copy
showProtein(ag_new)

# AtomGroup membership: `in` tests between shorthand selections and the group.
ag.calpha in ag.backbone

ag.backbone in ag.protein

ag.water in ag.protein

ag.water in ag

# Selection operations: fetch chains A and B through the dot shorthand.
chA = ag.chain_A
chB = ag.chain_B

print(chA & chB) # intersection

sel = chA | chB # union

# Selection string recorded for the union.
sel.getSelstr()

~chA #not

# Store data in AtomGroup: parse '1p38' and look at its residue numbers.
atoms = parsePDB('1p38')
atoms.getResnums()

# Derive a second array by dividing every residue number by 10.
resnum_fract = atoms.getResnums() / 10.
resnum_fract

# Attach the derived array under the label 'resnumfract' and read it back.
atoms.setData('resnumfract', resnum_fract)
atoms.getData('resnumfract')

# Saving to files: saveAtoms is called without a filename.
# NOTE(review): presumably this produces '1p38.ag.npz', the file loaded
# below — confirm.
saveAtoms(atoms)

# Reload from '1p38.ag.npz' and read the 'resnumfract' data from the
# reloaded object.
atoms = loadAtoms('1p38.ag.npz')
atoms.getData('resnumfract')

# Fetch PDB files: several identifiers are passed in one call.
# NOTE(review): '@!~#' is not a well-formed PDB identifier — presumably
# included on purpose to show how invalid input is reported; confirm.
fetchPDB('1p38', '1r39', '@!~#') # searches working directory, local resources, then downloads

# Fetch the same entry through the HTTP- and FTP-specific helpers.
# NOTE(review): the FTP call depends on a PDB FTP server still being
# reachable — confirm it is still supported.
fetchPDBviaHTTP('1p38')
fetchPDBviaFTP('1p38')

# Comparing and aligning structures: parse the two structures to compare
# ('1p38' as `p38`, '1zz2' as `bound`).
p38 = parsePDB('1p38')
bound = parsePDB('1zz2')

# Draw both structures together before any alignment.
showProtein(p38, bound)

# Chain matching and RMSD: take the first result of matchChains and unpack
# its four items.
# NOTE(review): presumably `seqid` and `overlap` are percent sequence
# identity and percent overlap of the matched chains — confirm.
apo_chA, bnd_chA, seqid, overlap = matchChains(p38, bound)[0]
print(bnd_chA)
print(seqid)
print(overlap)

# Sizes of the two matched parts next to the sizes of the full structures.
print(len(apo_chA),len(bnd_chA),len(p38),len(bound))

# Distinct atom names present in the matched part of `p38`.
set(apo_chA.getNames())

# RMSD between the matched parts before superposition.
calcRMSD(apo_chA, bnd_chA)

# Align chains: superpose returns two values; the first is rebound to
# `bnd_chA`, then the RMSD is recomputed.
# NOTE(review): presumably superpose moves its first argument onto its
# second — confirm.
bnd_chA, transformation = superpose(bnd_chA, apo_chA)
calcRMSD(bnd_chA, apo_chA)

# Draw both structures again after the superposition step.
showProtein(p38, bound)

# Building biomolecules.
# parse the monomer structure and PDB file header information
# the header includes transformations for forming tetramer
monomer, header = parsePDB('1k4c', header=True)
monomer

# Draw the monomer with the legend turned on.
showProtein(monomer, legend=True)

# Dot shorthand selection 'not name K'; the result is what gets passed to
# buildBiomolecules below.
without_K = monomer.not_name_K
without_K

# Build the assembly from the header information and the selected atoms.
tetramer = buildBiomolecules(header, without_K)
tetramer

# Draw the assembled structure.
showProtein(tetramer)

Protein dynamics with ProDy

Import from ProDy

ProDy API naming conventions

Function names

Class names

Class method names

Usage example

Visualization

Better visualization

How many atoms does PDB 3ERK have?

File handling

Structures and AtomGroups

Some AtomGroup methods

Getters

Setters

Atom instances

Subset of atoms

Hierarchical Views

Iterations

Indexing

Atom Selections

Selecting by distance

How many non-water protein atoms are there within 5 Å of SB4?

Keyword arguments

Dot selection shorthand

Coordinate Sets

Coordinates

Operations with Atoms

Copying atoms

AtomGroup addition

AtomGroup membership

Selection operations

Store data in AtomGroup

Saving to files

PDB Access

Fetch PDB files

Comparing and aligning structures

Chain matching and RMSD

Align chains

Building biomolecules

Building biomolecules

Structures and `AtomGroups`

Some `AtomGroup` methods

`Atom` instances

`AtomGroup` addition

`AtomGroup` membership

`Selection` operations

Store data in `AtomGroup`