Compare theory vs. sim scaled by bin width (not theory, which may be zero).

[sawsim.git] / pysawsim / parameter_scan.py
diff --git a/pysawsim/parameter_scan.py b/pysawsim/parameter_scan.py

index 4e11c6ab97ccac0466b9dadeb7dd437ee81525f7..3d6e99bbed6c42977dde1c7ea369fe5accdfd356 100644 (file)
--- a/pysawsim/parameter_scan.py
+++ b/pysawsim/parameter_scan.py
@@ -36,6 +36,10 @@ from .sawsim_histogram import sawsim_histogram
  from .sawsim import SawsimRunner
  
  
+_multiprocess_can_split_ = True
+"""Allow nosetests to split tests between processes.
+"""
+
  FIGURE = pylab.figure()  # avoid memory problems.
  """`pylab` keeps internal references to all created figures, so share
  a single instance.
@@ -146,21 +150,21 @@ class HistogramMatcher (object):
      unique to that experiment.
  
      >>> from .manager.thread import ThreadManager
-    >>> velocity_stream = StringIO(EXAMPLE_HISTOGRAM_FILE_CONTENTS)
+    >>> histogram_stream = StringIO(EXAMPLE_HISTOGRAM_FILE_CONTENTS)
      >>> param_format_string = (
      ...     '-s cantilever,hooke,0.05 -N1 '
      ...     '-s folded,null -N8 '
      ...     '-s "unfolded,wlc,{0.39e-9,28e-9}" '
      ...     '-k "folded,unfolded,bell,{%g,%g}" -q folded')
      >>> m = ThreadManager()
-    >>> sr = SawsimRunner(sawsim='bin/sawsim', manager=m)
-    >>> hm = HistogramMatcher(velocity_stream, param_format_string, sr, N=3)
+    >>> sr = SawsimRunner(manager=m)
+    >>> hm = HistogramMatcher(histogram_stream, param_format_string, sr, N=3)
      >>> hm.plot([[1e-5,1e-3,3],[0.1e-9,1e-9,3]], logx=True, logy=False)
      >>> m.teardown()
      """
      def __init__(self, histogram_stream, param_format_string,
                   sawsim_runner, N=400, residual_type='jensen-shannon',
-                 plot=True):
+                 plot=False):
          self.experiment_histograms = self._read_force_histograms(
              histogram_stream)
          self.param_format_string = param_format_string
@@ -172,9 +176,13 @@ class HistogramMatcher (object):
      def _read_force_histograms(self, stream):
          """
          File format:
-        # comment and blank lines ignored
-        <velocity in m/s><whitespace><path to histogram file>
-        ...
+
+          # comment and blank lines ignored
+          #HISTOGRAM: <histogram-specific params>
+          <pysawsim.histogram.Histogram-compatible histogram>
+          #HISTOGRAM: <other histogram-specific params>
+          <another pysawsim.histogram.Histogram-compatible histogram>
+          ...
  
          >>> import sys
          >>> stream = StringIO(EXAMPLE_HISTOGRAM_FILE_CONTENTS)
@@ -233,21 +241,7 @@ class HistogramMatcher (object):
          return '%s %s' % (
              self.param_format_string % tuple(params), hist_params)
  
-    def get_all_unfolding_data(self, dirname, velocity_string):
-        datafile = os.path.join(dirname, "data_" + velocity_string)
-        return numpy.fromfile(datafile, sep=" ")
-
-        sawsim_histograms = {}
-        for velocity in velocities:
-            unfolding_forces = self.get_all_unfolding_data(dirname, str(velocity))
-            bin_edges = histograms[velocity].bin_edges
-            h = Histogram()
-            h.from_data(unfolding_forces, bin_edges)
-            sawsim_histograms[velocity] = h
-            sawsim_histograms[velocity].normalize()
-        return sawsim_histograms
-
-    def _residual(self, params):
+    def residual(self, params):
          residual = 0
          for hist_params,experiment_hist in self.experiment_histograms.iteritems():
              sawsim_hist = sawsim_histogram(
@@ -263,7 +257,7 @@ class HistogramMatcher (object):
                  self._plot_residual_comparison(
                      experiment_hist, sawsim_hist, residual=r,
                      title=title, filename=filename)
-        log().debug('residual: %g' % residual)
+        log().debug('residual %s: %g' % (params, residual))
          return residual
  
      def plot(self, param_ranges, logx=False, logy=False, contour=False):
@@ -286,7 +280,7 @@ class HistogramMatcher (object):
                  log().info('point %d %d (%d of %d)'
                             % (i, j, i*(len(y)-1) + j, (len(x)-1)*(len(y)-1)))
                  params = (xi,yj)
-                r = self._residual(params)
+                r = self.residual(params)
                  C[j,i] = numpy.log(r) # better resolution in valleys
                  if MEM_DEBUG == True:
                      log().debug('RSS: %d KB' % rss())
@@ -333,6 +327,8 @@ def parse_param_ranges_string(string):
  
      >>> parse_param_ranges_string('[1,2,3],[4,5,6]')
      [[1.0, 2.0, 3.0], [4.0, 5.0, 6.0]]
+    >>> parse_param_ranges_string('[1,2,3]')
+    [[1.0, 2.0, 3.0]]
      """
      ranges = []
      for range_string in string.split("],["):
@@ -347,8 +343,7 @@ def main(argv=None):
      >>> f = tempfile.NamedTemporaryFile()
      >>> f.write(EXAMPLE_HISTOGRAM_FILE_CONTENTS)
      >>> f.flush()
-    >>> main(['-s', 'bin/sawsim',
-    ...       '-r', '[1e-5,1e-3,3],[0.1e-9,1e-9,3]',
+    >>> main(['-r', '[1e-5,1e-3,3],[0.1e-9,1e-9,3]',
      ...       '-N', '2',
      ...       f.name])
      >>> f.close()
@@ -388,45 +383,47 @@ def main(argv=None):
          if option.dest == 'param_string':
              continue
          parser.add_option(option)
-    parser.add_option("-f","--param-format", dest="param_format",
-                      metavar="FORMAT",
-                      help="Convert params to sawsim options (%default).",
+    parser.add_option('-f','--param-format', dest='param_format',
+                      metavar='FORMAT',
+                      help='Convert params to sawsim options (%default).',
                        default=('-s cantilever,hooke,0.05 -N1 -s folded,null -N8 -s "unfolded,wlc,{0.39e-9,28e-9}" -k "folded,unfolded,bell,{%g,%g}" -q folded'))
-    parser.add_option("-p","--initial-params", dest="initial_params",
-                      metavar="PARAMS",
-                      help="Initial params for fitting (%default).",
+    parser.add_option('-p','--initial-params', dest='initial_params',
+                      metavar='PARAMS',
+                      help='Initial params for fitting (%default).',
                        default='3.3e-4,0.25e-9')
-    parser.add_option("-r","--param-range", dest="param_range",
-                      metavar="PARAMS",
-                      help="Param range for plotting (%default).",
+    parser.add_option('-r','--param-range', dest='param_range',
+                      metavar='PARAMS',
+                      help='Param range for plotting (%default).',
                        default='[1e-5,1e-3,20],[0.1e-9,1e-9,20]')
-    parser.add_option("-R","--residual", dest="residual",
-                      metavar="STRING",
-                      help="Residual type (from 'jensen-shannon', 'chi-squared', 'mean', 'std-dev'; default: %default).",
+    parser.add_option('--logx', dest='logx',
+                      help='Use a log scale for the x range.',
+                      default=False, action='store_true')
+    parser.add_option('--logy', dest='logy',
+                      help='Use a log scale for the y range.',
+                      default=False, action='store_true')
+    parser.add_option('-R','--residual', dest='residual',
+                      metavar='STRING',
+                      help='Residual type (from %s; default: %%default).'
+                      % ', '.join(Histogram().types()),
                        default='jensen-shannon')
-    parser.add_option("-P","--plot-residuals", dest="plot_residuals",
-                      help="Generate residual difference plots for each point in the plot range.",
-                      default=False, action="store_true")
-    parser.add_option("--logx", dest="logx",
-                      help="Use a log scale for the x range.",
-                      default=False, action="store_true")
-    parser.add_option("--logy", dest="logy",
-                      help="Use a log scale for the y range.",
-                      default=False, action="store_true")
-    parser.add_option("-c","--contour-plot", dest="contour_plot",
-                      help="Select contour plot (vs. the default pseudocolor plot).",
-                      default=False, action="store_true")
+    parser.add_option('-P','--plot-residuals', dest='plot_residuals',
+                      help='Generate residual difference plots for each point in the plot range.',
+                      default=False, action='store_true')
+    parser.add_option('-c','--contour-plot', dest='contour_plot',
+                      help='Select contour plot (vs. the default pseudocolor plot).',
+                      default=False, action='store_true')
  
      options,args = parser.parse_args(argv)
  
      initial_params = [float(p) for p in options.initial_params.split(",")]
      param_ranges = parse_param_ranges_string(options.param_range)
-    velocity_file = args[0]
+    histogram_file = args[0]
      sr_call_params = sr.initialize_from_options(options)
  
      try:
          hm = HistogramMatcher(
-            file(velocity_file, 'r'), param_format_string=options.param_format,
+            file(histogram_file, 'r'),
+            param_format_string=options.param_format,
              sawsim_runner=sr, residual_type=options.residual,
              plot=options.plot_residuals, **sr_call_params)
          #hm.fit(initial_params)