%%html
<script src="http://bits.csb.pitt.edu/asker.js/lib/asker.js"></script>
<script>
$3Dmolpromise = new Promise((resolve, reject) => { 
    require(['https://3dmol.org/build/3Dmol-nojquery.js'], function(){       
            resolve();});
});

require(['https://cdnjs.cloudflare.com/ajax/libs/Chart.js/2.2.2/Chart.js'], function(Ch){
 Chart = Ch;
});

$('head').append('<link rel="stylesheet" href="http://bits.csb.pitt.edu/asker.js/themes/asker.default.css" />');


//the callback is provided a canvas object and data 
var chartmaker = function(canvas, labels, data) {
  var ctx = $(canvas).get(0).getContext("2d");
     var dataset = {labels: labels,                     
    datasets:[{
     data: data,
     backgroundColor: "rgba(150,64,150,0.5)",
         fillColor: "rgba(150,64,150,0.8)",    
  }]};
  var myBarChart = new Chart(ctx,{type:'bar',data:dataset,options:{legend: {display:false},
        scales: {
            yAxes: [{
                ticks: {
                    min: 0,
                }
            }]}}});
};

$(".jp-InputArea .o:contains(html)").closest('.jp-InputArea').hide();

</script>


from prody import *
import py3Dmol
ubi = parsePDB('2lz3')
print(ubi.numCoordsets())

21


showProtein(ubi)

<py3Dmol.view at 0x7f31887d8310>


ubi_ensemble = Ensemble(ubi.calpha)
print("Before iterpose",ubi_ensemble.getRMSDs().mean())
ubi_ensemble.iterpose()
print("After iterpose",ubi_ensemble.getRMSDs().mean())

Before iterpose 8.253871223076873

@> Superposing  [100%] 0s

After iterpose 0.724626075587582


help(ubi_ensemble.iterpose)

Help on method iterpose in module prody.ensemble.ensemble:

iterpose(rmsd=0.0001, quiet=False) method of prody.ensemble.ensemble.Ensemble instance
    Iteratively superpose the ensemble until convergence.  Initially,
    all conformations are aligned with the reference coordinates.  Then
    mean coordinates are calculated, and are set as the new reference
    coordinates.  This is repeated until reference coordinates do not
    change.  This is determined by the value of RMSD between the new and
    old reference coordinates.  Note that at the end of the iterative
    procedure the reference coordinate set will be average of conformations
    in the ensemble.
    
    :arg rmsd: change in reference coordinates to determine convergence,
        default is 0.0001 Å RMSD
    :type rmsd: float


%%html

<div id="pca" style="width: 500px"></div>
<script>
$('head').append('<link rel="stylesheet" href="http://bits.csb.pitt.edu/asker.js/themes/asker.default.css" />');

    var divid = '#pca';
	jQuery(divid).asker({
	    id: divid,
	    question: "PCA works well for high-dimensional data.",
		answers: ['True','False'],
        server: "http://bits.csb.pitt.edu/asker.js/example/asker.cgi",
		charter: chartmaker})
    
$(".jp-InputArea .o:contains(html)").closest('.jp-InputArea').hide();


</script>


pca = PCA('ubi')

pca.buildCovariance(ubi_ensemble)
cov = pca.getCovariance()


%%html
<div id="prodyc" style="width: 500px"></div>
<script>
$('head').append('<link rel="stylesheet" href="http://bits.csb.pitt.edu/asker.js/themes/asker.default.css" />');

    var divid = '#prodyc';
	jQuery(divid).asker({
	    id: divid,
	    question: "What is the shape of the covariance matrix? We have 21 conformations and 56 atoms.",
		answers: ["56x56","21x56","21x168","168x168","63x56"],
        server: "http://bits.csb.pitt.edu/asker.js/example/asker.cgi",
		charter: chartmaker})
    
$(".jp-InputArea .o:contains(html)").closest('.jp-InputArea').hide();


</script>


cov.shape

(168, 168)


help(pca.calcModes)
pca.calcModes()

Help on method calcModes in module prody.dynamics.pca:

calcModes(n_modes=20, turbo=True) method of prody.dynamics.pca.PCA instance
    Calculate principal (or essential) modes.  This method uses
    :func:`scipy.linalg.eigh`, or :func:`numpy.linalg.eigh`, function
    to diagonalize the covariance matrix.
    
    :arg n_modes: number of non-zero eigenvalues/vectors to calculate,
        default is 20,
        if **None** or ``'all'`` is given, all modes will be calculated
    :type n_modes: int
    
    :arg turbo: when available, use a memory intensive but faster way to
        calculate modes, default is **True**
    :type turbo: bool


pca[0].getEigval() #mode zero - has highest variance

18.28368776087946


pca[0].getVariance() #same as eigen value

18.28368776087946


pca[0].getEigvec() #these are the contributions of each coordinate to this mode

array([ 0.10895504, -0.09862288, -0.00069774,  0.12734766, -0.09529924,
        0.01728582,  0.09240989, -0.10821783, -0.00378215,  0.07455981,
       -0.09152148,  0.00040461,  0.08382771, -0.07502066,  0.01207025,
        0.07575377, -0.08990909,  0.00535893,  0.03427309, -0.07144482,
       -0.00699088,  0.04409968, -0.03099255,  0.00834164,  0.07587458,
       -0.04170089,  0.00526682,  0.05191522, -0.07196191,  0.00379224,
        0.02259604, -0.05094133,  0.00640529,  0.04676089, -0.02941339,
        0.00849644,  0.0464955 , -0.05902509,  0.00232354, -0.01470513,
       -0.03835522,  0.00499573, -0.00278386, -0.00494205,  0.0264534 ,
        0.0029671 , -0.00770994,  0.0295055 , -0.00796946, -0.01000113,
        0.01861126, -0.01755458,  0.01802547,  0.00189692,  0.00765933,
        0.04189029,  0.0244628 ,  0.00835689,  0.01903618,  0.02190465,
       -0.0441638 ,  0.03989105, -0.01788036, -0.02619707,  0.12531529,
       -0.02848483,  0.0543055 ,  0.13310853,  0.02580789, -0.00745104,
        0.07604764,  0.01393704, -0.08793328,  0.19185374, -0.09044218,
        0.04279204,  0.30141262, -0.08296667,  0.11576725,  0.26290306,
       -0.04763831, -0.06185247,  0.22253404, -0.09664783, -0.09239755,
        0.08881437,  0.07226983, -0.09992072,  0.07962558,  0.09435603,
       -0.07784717,  0.09881887,  0.06423209, -0.06198042,  0.08361729,
        0.05641675, -0.06530563,  0.06444374,  0.06652602, -0.05987737,
        0.08049509,  0.06075073, -0.03014279,  0.0685254 ,  0.02757251,
       -0.03427367,  0.02589602,  0.03518655, -0.06263196,  0.03504964,
        0.04866357, -0.04070921,  0.06486652,  0.0448722 , -0.01563442,
        0.04627099,  0.02900357, -0.03654269,  0.02419248,  0.03591002,
       -0.0370253 ,  0.05321956,  0.03747252,  0.01672878,  0.0365496 ,
        0.00822769,  0.01449845, -0.00095547,  0.0234832 ,  0.01170215,
       -0.00056749,  0.02890748,  0.01599113,  0.00464259,  0.01497787,
        0.01513886, -0.01650674, -0.01017376,  0.00189782, -0.04663787,
        0.01382682,  0.0014967 , -0.02525573,  0.01747316,  0.0288226 ,
       -0.03194735, -0.04478236,  0.00333668, -0.11138434, -0.06761427,
       -0.04450923, -0.13827834,  0.01175396,  0.00818127, -0.07764186,
       -0.01066473,  0.02718498, -0.15660379, -0.16482202, -0.09226899,
       -0.27114029, -0.12982267, -0.13956175, -0.24849636, -0.05827123,
       -0.00045689, -0.18655049, -0.16752135])


for mode in pca[:4]:
    print(calcFractVariance(mode).round(2))

0.54
0.25
0.08
0.05


calcFractVariance(pca)

array([5.44746801e-01, 2.45008121e-01, 7.53087244e-02, 4.76585603e-02,
       2.48514775e-02, 1.89408289e-02, 1.10784476e-02, 8.86489115e-03,
       6.56613195e-03, 4.91503637e-03, 3.31646501e-03, 2.68053785e-03,
       2.10061548e-03, 1.53720323e-03, 8.39347607e-04, 5.63728260e-04,
       3.87769668e-04, 3.44092597e-04, 1.89852401e-04, 1.01367370e-04])


calcFractVariance(pca).sum()

1.0000000000000004


pca.getVariances()

array([1.82836878e+01, 8.22336538e+00, 2.52763522e+00, 1.59959496e+00,
       8.34106146e-01, 6.35723241e-01, 3.71833071e-01, 2.97538052e-01,
       2.20383316e-01, 1.64966531e-01, 1.11312651e-01, 8.99686184e-02,
       7.05043103e-02, 5.15941421e-02, 2.81715643e-02, 1.89207747e-02,
       1.30149631e-02, 1.15490015e-02, 6.37213842e-03, 3.40225833e-03])


pca.getVariances()/pca.getVariances().sum()

array([5.44746801e-01, 2.45008121e-01, 7.53087244e-02, 4.76585603e-02,
       2.48514775e-02, 1.89408289e-02, 1.10784476e-02, 8.86489115e-03,
       6.56613195e-03, 4.91503637e-03, 3.31646501e-03, 2.68053785e-03,
       2.10061548e-03, 1.53720323e-03, 8.39347607e-04, 5.63728260e-04,
       3.87769668e-04, 3.44092597e-04, 1.89852401e-04, 1.01367370e-04])


%matplotlib inline
showSqFlucts(pca);


showProtein(ubi,data=calcSqFlucts(pca))

<py3Dmol.view at 0x7f3188519ca0>


showProjection(ubi_ensemble, pca[:2]);


showProjection(ubi_ensemble, pca[:3]);

/home/anupam06/anaconda3/lib/python3.9/site-packages/prody/dynamics/plotting.py:327: MatplotlibDeprecationWarning: Axes3D(fig) adding itself to the figure is deprecated since 3.4. Pass the keyword argument auto_add_to_figure=False and use fig.add_axes(ax) to suppress this warning. The default value of auto_add_to_figure will change to False in mpl3.5 and True values will no longer work in 3.6.  This is consistent with other Axes classes.
  show = Axes3D(cf)


%%html
<div id="prodyp" style="width: 500px"></div>
<script>
$('head').append('<link rel="stylesheet" href="http://bits.csb.pitt.edu/asker.js/themes/asker.default.css" />');

    var divid = '#prodyp';
	jQuery(divid).asker({
	    id: divid,
	    question: "What do the dots on the previous picture represent?",
		answers: ["Conformations","Atoms","Modes","Fluctuations","Covariance"],
        server: "http://bits.csb.pitt.edu/asker.js/example/asker.cgi",
		charter: chartmaker})
    
$(".jp-InputArea .o:contains(html)").closest('.jp-InputArea').hide();


</script>


anm, atoms = calcANM(ubi, selstr='calpha')


anm = ANM('Ubi')
anm.buildHessian(ubi.calpha)
anm.calcModes(n_modes=20)


slowest_mode = anm[0]
print(slowest_mode)
print(slowest_mode.getEigval().round(3))

Mode 1 from ANM Ubi
0.082


len(slowest_mode.getEigvec())

168


calcFractVariance(anm)

array([0.24980938, 0.24410503, 0.08996715, 0.07112073, 0.03707691,
       0.03623665, 0.0321058 , 0.02797792, 0.02703105, 0.0237444 ,
       0.02140593, 0.01979188, 0.01878154, 0.01573741, 0.0154018 ,
       0.01493917, 0.01476959, 0.01402273, 0.01320577, 0.01276915])


oneubi = ubi
while oneubi.numCoordsets() > 1:
    oneubi.delCoordset(-1)
showProtein(oneubi,mode=slowest_mode,data=calcSqFlucts(anm),anim=True,scale=25)

<py3Dmol.view at 0x7f31882f8d90>


showProtein(oneubi,mode=anm[1].getEigvec(),data=calcSqFlucts(anm),anim=True,amplitude=25)

<py3Dmol.view at 0x7f31882ec790>


printOverlapTable(pca[:4], anm[:4])

Overlap Table
                      ANM Ubi
               #1     #2     #3     #4
PCA ubi #1    0.00  +0.74   0.00  +0.20
PCA ubi #2    0.00  +0.20   0.00  -0.36
PCA ubi #3   +0.01  +0.04   0.00  -0.26
PCA ubi #4   +0.01  +0.33   0.00  -0.07


showOverlapTable(pca[:4], anm[:4]);


showProtein(oneubi,data=calcSqFlucts(pca[0]),mode=pca[0].getEigvec(),anim=True,amplitude=25)

<py3Dmol.view at 0x7f31887d8100>


import prody
import py3Dmol
import io

pdb = '2l3y' # 2lz3
prot = prody.parsePDB(pdb)
ensemble = prody.Ensemble(prot.ca)
ensemble.iterpose()
pca = prody.PCA()
pca.buildCovariance(ensemble)
pca.calcModes()
flucts = prody.calcSqFlucts(pca)
print("Min/Max Flucts %.2f %.2f"%(flucts.min(),flucts.max()))
prot.setBetas(0) #not actually necessary
prot.ca.setBetas(flucts)

#I feel like there should be a more succinct way to remove
#all but the first coordinate set, but I can't find it
n = len(prot.getCoordsets())
singleprot = prot
singleprot.delCoordset(range(1,n))

#instead of write to a file to get the pdb string, 
#can write to a stringIO, which acts like a file
pdbstr = io.StringIO()
prody.writePDBStream(pdbstr, singleprot)

view = py3Dmol.view()
view.addModel(pdbstr.getvalue())
view.setStyle({'cartoon':{'colorscheme':{'prop':'b','gradient':'sinebow','min':flucts.min(),'max':flucts.max()}}})
view.zoomTo()

@> Superposing  [100%] 0s

Min/Max Flucts 0.33 144.97

<py3Dmol.view at 0x7f316a81d850>

ProDy¶

10/4/2022¶

Dynamics Analysis¶

PCA calculations¶

What is PCA?¶

PCA calculations¶

PCA Calculations¶

PCA Calculations¶

Variance¶

Fluctuations¶

Projection¶

Projection¶

Elastic Network Model¶

ANM calculations¶

ANM¶

Mode 2¶

Compare PCA and ANM¶

Mode 1 of PCA¶

ProDy Docs and Tutorials¶

Project¶