|
| 1 | + |
| 2 | + |
| 3 | +```python |
| 4 | +# Default Libraries |
| 5 | +import os |
| 6 | +import StringIO |
| 7 | + |
| 8 | +# External Libraries |
| 9 | +import pandas as pd |
| 10 | +import numpy as np |
| 11 | +import matplotlib |
| 12 | +import matplotlib.pyplot as plt |
| 13 | +import seaborn as sns |
| 14 | +import networkx as nx |
| 15 | +from IPython.display import FileLink, FileLinks |
| 16 | + |
| 17 | +# Own Libraries |
| 18 | +import rstoolbox # Learn about this library at: http://lpdi-epfl.github.io/RosettaSilentToolbox |
| 19 | + |
| 20 | +import readme |
| 21 | + |
| 22 | +# Global Parameters |
| 23 | +plt.rcParams['svg.fonttype'] = 'none' |
| 24 | +rstoolbox.utils.format_Ipython() |
| 25 | +``` |
| 26 | + |
| 27 | + |
| 28 | + |
| 29 | + |
| 30 | +<style> |
| 31 | +table.dataframe { |
| 32 | + font-family: monospace; |
| 33 | +} |
| 34 | +</style> |
| 35 | + |
| 36 | + |
| 37 | + |
| 38 | +# Design of a RSVF site II carrier from 1KX8 |
| 39 | + |
| 40 | +> This summary does not track all attempts and variations, just the pathway towards obtaining the designs that were experimentally characterized. |
| 41 | +
|
| 42 | + |
| 43 | +```python |
| 44 | +# Direct information obtain from scoring 1kx8 with Rosetta |
| 45 | +baseline = rstoolbox.io.get_sequence_and_structure(os.path.join('selection', 'baseline', '1kx8.pdb')) |
| 46 | +baseline |
| 47 | +``` |
| 48 | + |
| 49 | + |
| 50 | + |
| 51 | + |
| 52 | +<div> |
| 53 | +<style scoped> |
| 54 | + .dataframe tbody tr th:only-of-type { |
| 55 | + vertical-align: middle; |
| 56 | + } |
| 57 | + |
| 58 | + .dataframe tbody tr th { |
| 59 | + vertical-align: top; |
| 60 | + } |
| 61 | + |
| 62 | + .dataframe thead th { |
| 63 | + text-align: right; |
| 64 | + } |
| 65 | +</style> |
| 66 | +<table border="1" class="dataframe"> |
| 67 | + <thead> |
| 68 | + <tr style="text-align: right;"> |
| 69 | + <th></th> |
| 70 | + <th>score</th> |
| 71 | + <th>fa_atr</th> |
| 72 | + <th>fa_rep</th> |
| 73 | + <th>fa_sol</th> |
| 74 | + <th>fa_intra_rep</th> |
| 75 | + <th>fa_intra_sol_xover4</th> |
| 76 | + <th>lk_ball_wtd</th> |
| 77 | + <th>fa_elec</th> |
| 78 | + <th>pro_close</th> |
| 79 | + <th>hbond_sr_bb</th> |
| 80 | + <th>hbond_lr_bb</th> |
| 81 | + <th>hbond_bb_sc</th> |
| 82 | + <th>hbond_sc</th> |
| 83 | + <th>dslf_fa13</th> |
| 84 | + <th>omega</th> |
| 85 | + <th>fa_dun</th> |
| 86 | + <th>p_aa_pp</th> |
| 87 | + <th>yhh_planarity</th> |
| 88 | + <th>ref</th> |
| 89 | + <th>rama_prepro</th> |
| 90 | + <th>time</th> |
| 91 | + <th>description</th> |
| 92 | + <th>sequence_A</th> |
| 93 | + <th>structure_A</th> |
| 94 | + <th>phi_A</th> |
| 95 | + <th>psi_A</th> |
| 96 | + </tr> |
| 97 | + </thead> |
| 98 | + <tbody> |
| 99 | + <tr> |
| 100 | + <th>0</th> |
| 101 | + <td>165.939</td> |
| 102 | + <td>-594.399</td> |
| 103 | + <td>185.277</td> |
| 104 | + <td>426.021</td> |
| 105 | + <td>1.376</td> |
| 106 | + <td>25.587</td> |
| 107 | + <td>-16.933</td> |
| 108 | + <td>-141.967</td> |
| 109 | + <td>7.165</td> |
| 110 | + <td>-50.138</td> |
| 111 | + <td>-2.655</td> |
| 112 | + <td>-6.671</td> |
| 113 | + <td>-6.171</td> |
| 114 | + <td>-2.659</td> |
| 115 | + <td>0.059</td> |
| 116 | + <td>326.333</td> |
| 117 | + <td>-8.581</td> |
| 118 | + <td>0.0</td> |
| 119 | + <td>16.661</td> |
| 120 | + <td>7.633</td> |
| 121 | + <td>2.0</td> |
| 122 | + <td>1kx8_0001</td> |
| 123 | + <td>NINLDEILANKRLLVAYVNCVMERGKCSPEGKELKEHLQDAIENGCKKCTENQEKGAYRVIEHLIKNEIEIWRELTAKYDPTGNWRKKYEDRAKAAGIVI</td> |
| 124 | + <td>LLLLHHHHHLHHHHHHHHHHHLLLLLLLHHHHHHHHHHHHHHHHLLLLLLHHHHHHHHHHHHHHHHHLHHHHHHHHHHHLLLLLLHHHHHHHHHHHLLLL</td> |
| 125 | + <td>[0.0, -46.7858, -126.674, ...]</td> |
| 126 | + <td>[-42.2254, 137.85, -165.222, ...]</td> |
| 127 | + </tr> |
| 128 | + </tbody> |
| 129 | +</table> |
| 130 | +</div> |
| 131 | + |
| 132 | + |
| 133 | + |
| 134 | +## Making the designs |
| 135 | + |
| 136 | +The construction of the **1kx8**-derived designs implies the grafting to RSVF's site II as represented in [3ixt.pdb](design/3ixt.pdb) without its neutralizing antibody. |
| 137 | + |
| 138 | +The process was performed in a two-generation step. |
| 139 | + |
| 140 | +### Step 1 |
| 141 | + |
| 142 | +Site II was grafted into **1kx8** by means of the _NubInitioMover_ and the sequence space after folding was explored with _FastDesign_. All within the RosettaScript [fold_design.xml](design/fold_design.xml) into a [SLURM](https://slurm.schedmd.com/)-based cluster through the submiter script [submit_gen1.sh](design/submit_gen1.sh). |
| 143 | + |
| 144 | +A total of 12483 decoys were generated. The aim of this firts run was to explore and find a folded conformation that would: |
| 145 | + |
| 146 | +* carry and stabilize at backbone level site II. |
| 147 | +* fold back to a conformation close to **1kx8** keeping the proper beta pairing. |
| 148 | + |
| 149 | +From all the decoys, [188_1kx8_0033](design/188_1kx8_0033.pdb) was selected as seed for the next step of the process. The values of this decoy in the context of the design population are marked with a red line. |
| 150 | + |
| 151 | + |
| 152 | +```python |
| 153 | +step1 = rstoolbox.io.parse_rosetta_file('design/1kx8_silent.minisilent.gz') |
| 154 | +readme.plot_step1(step1) |
| 155 | +``` |
| 156 | + |
| 157 | + |
| 158 | + |
| 159 | + |
| 160 | + |
| 161 | +### Step 2 |
| 162 | + |
| 163 | +The second generation derives from [188_1kx8_0033](design/188_1kx8_0033.pdb) and basically runs the same conditions but using this decoy instead of **1kx8** as template. |
| 164 | + |
| 165 | +The executed script is still [fold_design.xml](design/fold_design.xml), but the submiter script is [submit_gen2.sh](design/submit_gen2.sh). |
| 166 | + |
| 167 | +A total of 12493 decoys were generated. |
| 168 | + |
| 169 | +From all the decoys, the top 500 best scorers were evaluated in terms of packing, BUNS and secondary structure divergence form the starting decoy with the [fastrelax_cav_vol_buns.xml](design/fastrelax_cav_vol_buns.xml) RosettaScript after global relaxation. The six decoys with the best behaviour after evaluating this parameters and some visual inspection became the seed for the seven desings of **generation 1**. The values for those designs are highlighted in the distributions in red. |
| 170 | + |
| 171 | + |
| 172 | +```python |
| 173 | +step2 = rstoolbox.io.parse_rosetta_file('design/1kx8_silent2.minisilent.gz') |
| 174 | +readme.plot_step2(step2) |
| 175 | +``` |
| 176 | + |
| 177 | + |
| 178 | + |
| 179 | + |
| 180 | + |
| 181 | + |
| 182 | +```python |
| 183 | +step3 = rstoolbox.io.parse_rosetta_file('design/top500score.silent') |
| 184 | +readme.plot_step3(step3) |
| 185 | +``` |
| 186 | + |
| 187 | + |
| 188 | + |
| 189 | + |
| 190 | + |
| 191 | +### Generation 1 |
| 192 | + |
| 193 | +The seven designs of **generation 1** derive from the 6 selected from **step 3** after human-guided design (mutations were selected and imposed manually). |
| 194 | + |
| 195 | +### Generation 2 |
| 196 | + |
| 197 | +The eight designs of **generation 2** derive from disulfidized versions of **generation 1** with automatic mutations added to fit the disulfides. |
| 198 | + |
| 199 | + |
| 200 | +Data from those two generations is discussed in the paper. |
| 201 | + |
| 202 | +# Experimental Data |
| 203 | + |
| 204 | + |
| 205 | +```python |
| 206 | +designs = readme.load_experimental() |
| 207 | +readme.firstgen_plot(designs) |
| 208 | +``` |
| 209 | + |
| 210 | + |
| 211 | + |
| 212 | + |
| 213 | + |
| 214 | + |
| 215 | +```python |
| 216 | +readme.secondgen_plot(designs) |
| 217 | +``` |
| 218 | + |
| 219 | + |
| 220 | + |
| 221 | + |
0 commit comments