src/introduction/main.tex

   1 \chapter{Introduction}
   2 \label{sec:intro}
   3
   4 \section{The Protein Folding Problem}
   5 \label{sec:folding-problem}
   6
   7 % Why study protein folding?
   8 In biological systems the most important molecules, such as proteins,
   9 nucleic acids, and polysaccharides, are all polymers.  Understanding
  10 the properties and functions of these polymeric molecules is crucial
  11 in understanding the molecular mechanisms behind structures and
  12 processes in cells.
  13
  14 % What do genes do?  Why is protein folding interesting?
  15 An organism's genetic code is stored in DNA%
  16 \nomenclature{DNA}{Deoxyribonucleic Acid}
  17 in the cell nucleus.
  18 DNA sequencing is a fairly well developed field, with fundamental work
  19 such as the Human Genome Project seeing major development in the early
  20 2000s\citep{wolfsberg01,mcpherson01,collins03}.  It is estimated that
  21 human genetic information contains approximately 25,000 genes, each
  22 encoding a protein\citep{claverie01,venter01}.  Knowing the amino acid
  23 sequence for a particular protein, however, does not immediately shed
  24 light on the protein's role in the body, or even the protein's
  25 probable conformation.  Indeed, a protein's conformation is often
  26 vitally important in executing its biological tasks
  27 (\cref{fig:ligand-receptor}).  Unfortunately, both predicting stable
  28 conformations of a given amino acid sequence and the inverse problem
  29 of finding sequences that form a given conformation have proven
  30 remarkably difficult.
  31
  32 \begin{figure}
  33   \begin{center}
  34   \includegraphics[width=2in]{figures/biotin-streptavidin/1SWE.png}%
  35   \caption{Complex of biotin\index{biotin} (red) and a
  36     streptavidin\index{streptavidin} tetramer (green)
  37     (\href{http://dx.doi.org/10.2210/pdb1swe/pdb}{PDB ID: 1SWE})%
  38     \citep{freitag97}.  The correct streptavidin conformation creates
  39     the biotin-specific binding pockets.  Biotin-streptavidin is a
  40     model ligand-receptor pair isolated from the bacterium
  41     \species{Streptomyces avidinii}%
  42     \index{Streptomyces@\species{Streptomyces avidinii}}.  Streptavidin
  43     binds to cell surfaces, and bound biotin increases streptavidin's
  44     cell-binding affinity\citep{alon90}.  Figure generated with
  45     \citetalias{pymol}.
  46     \label{fig:ligand-receptor}}
  47   \end{center}
  48 \end{figure}
  49
  50
  51 \section{Protein Folding Energy Landscapes}
  52 \label{sec:energy-landscape}
  53
  54 % the free energy landscape
  55 Folding a protein via a brute force sampling of all possible
  56 conformations is impossibly inefficient, due to the exponential
  57 scaling of possible conformations with protein length, as outlined by
  58 \citet{levinthal69}.  This has led to a succession of models
  59 explaining the folding mechanism.  For a number of years, the
  60 ``pathway'' model of protein folding enjoyed popularity
  61 (\cref{fig:folding:pathway})\citep{levinthal69}.  More recently, the
  62 ``landscape'' or ``funnel'' model has come to the fore
  63 (\cref{fig:folding:landscape})\citep{dill97}.
  64
  65 \begin{figure}
  66   \begin{center}
  67   \subfloat[][]{
  68     \begin{tikzpicture}[->,node distance=1.5cm]
  69       \tikzstyle{every state}=[draw=white]
  70       \node[state] (U)                 {$U$};
  71       \node[state] (I1)  [right of=U]  {$I_1$};
  72       \node[state] (I1X) [below of=I1] {$I_1^X$};
  73       \node[state] (I2)  [right of=I1] {$I_2$};
  74       \node[state] (I2X) [below of=I2] {$I_2^X$};
  75       \node[state] (N)   [right of=I2] {$N$};
  76
  77       \path[<->] (U)  edge (I1)
  78                  (I1) edge (I1X)
  79                  (I1) edge (I2)
  80                  (I2) edge (I2X)
  81                  (I2) edge (N);
  82     \end{tikzpicture}\label{fig:folding:pathway}}
  83   % \hspace{.25in}%
  84   \subfloat[][]{\includegraphics[width=2in]{figures/schematic/dill97-fig4}%
  85     \label{fig:folding:landscape}}
  86   \caption{\subref{fig:folding:pathway} A ``double T'' example of the
  87     pathway model of protein folding, in which the protein proceeds
  88     from the unfolded state $U$ to the native state $N$ via a series
  89     of metastable intermediate states $I_1$ and $I_2$ with two ``dead
  90     end'' states $I_1^X$ and $I_2^X$.  Adapted from \citet{bedard08}.
  91     \subref{fig:folding:landscape} The landscape model of protein
  92     folding, in which the protein diffuses through a multi-dimensional
  93     free energy landscape.  Separate folding attempts may take many
  94     distinct routes through this landscape on the way to the folded
  95     state.  Reproduced from \citet{dill97}.
  96     \label{fig:folding}}
  97   \end{center}
  98 \end{figure}
  99
 100 When the choice of theoretical approach becomes murky, you must gather
 101 experimental data to help distinguish between similar models.
 102 Separating the pathway model from the funnel model is only marginally
 103 within the realm of current experimental techniques, but with higher
 104 throughput and increased automation it should be easier to make such
 105 distinctions in the near future.
 106
 107
 108 \section{Single Molecule Protein Folding Studies}
 109 \label{sec:single-molecule}
 110
 111 The large size of proteins relative to simpler molecules imposes
 112 certain limitations on the information attainable from bulk
 113 measurements, because the macromolecules in a population can have
 114 diverse conformations and behaviors.  Bulk measurements average over
 115 these differences, producing excellent statistics for the mean, but
 116 making it difficult to understand the variation.  The individualized,
 117 and sometimes rare, behaviors of macromolecules can have important
 118 implications for their functions inside the cell.  Single molecule
 119 techniques, in which the macromolecules are studied one at a time,
 120 allow direct access to the variation within the population without
 121 averaging.  This provides important and complementary information
 122 about the functional mechanisms of several biological
 123 systems\citep{bustamante08}.
 124
 125 Single molecule techniques provide an opportunity to study protein
 126 folding and unfolding at the level of a single molecule, where the
 127 distinction between the pathway model and funnel model is clearer.
 128 They also provide a convenient benchmark for verifying molecular
 129 dynamics simulations, because it takes quite a bit of computing
 130 power to simulate even one biopolymer with anything close to atomic
 131 resolution over experimental timescales.  Even with significant
 132 computing resources, comparing molecular dynamics results with
 133 experimental data remains elusive.  For example, experimental pulling
 134 speeds are on the order of \bareU{$\mu$m/s}, while simulation pulling
 135 speeds are on the order of
 136 \bareU{m/s}\citep{lu98,lu99,rief02,zhao06,berkemeier11}.
 137
 138 % why AFM & what an AFM is
 139 Single molecule techniques for manipulating biopolymers include
 140 optical measurements, \ie, single molecule fluorescence microscopy and
 141 spectroscopy, and mechanical manipulations of individual
 142 macromolecules, \ie, force microscopy and spectroscopy using atomic
 143 force microscopes (AFMs), laser tweezers\citep{kellermayer97,forde02},
 144 magnetic tweezers\citep{smith92}, biomembrane force
 145 probes\citep{merkel99}, and centrifugal
 146 microscopes\citep{halvorsen09}.  These techniques cover a wide range
 147 of approaches, and even when the basic approach is the same
 148 (e.g.\ force microscopy), the different techniques span orders of
 149 magnitude in the range of their controllable parameters.
 150 \nomenclature{AFM}{Atomic Force Microscope (or Microscopy)}
 151
 152
 153 \section{Thesis Outline}
 154 \label{sec:outline}
 155
 156 TODO: fill in once structure has stabilized
 157
 158 %\Cref{sec:unfolding} of this thesis discusses the theory of protein
 159 %unfolding for single domains.  \Cref{sec:tension} discusses linker
 160 %tension modeling.  \Cref{sec:unfolding-distributions} pulls
 161 %\cref{sec:unfolding,sec:tension} together to discuss the theory of
 162 %mechanical unfolding experiments.  This theory makes straightforward
 163 %analysis of unfolding results difficult, so \cref{sec:sawsim} presents
 164 %a Monte Carlo simulation approach to fitting unfolding parameters, and
 165 %\cref{sec:contour-space} presents the contour-length space analysis
 166 %for converting force curves to unfolding pathway fingerprints.
 167 %\Cref{sec:temperature-theory} wraps up the theory section by extending
 168 %the analysis in \cref{sec:unfolding,sec:unfolding-distributions} to
 169 %multiple temperatures.
 170 %
 171 %\Cref{sec:apparatus} describes our experimental apparatus and methods,
 172 %as well as calibration procedures.  With both the theory and procedure
 173 %taken care of, \cref{sec:cantilever,sec:temperature}
 174 %present and analyze AFM cantilever- and temperature-dependent
 175 %unfolding behavior of the immunoglobulin-like domain 27 from human
 176 %Titin (I27).
 177 %
 178 %We close with \cref{sec:future}, which presents our conclusions and
 179 %discusses possible directions for future work.