Changeset 5d4777d – SasView

compare-new.py

-                      rff7119b
+                      r5d4777d
 from sasmodels.bumps_model import BumpsModel, plot_data, tic
+from sasmodels.gen import opencl_model, dll_model
+from sasmodels import gpu, dll
+from sasmodels.convert import revert_model
 def sasview_model(modelname, **pars):
 …
     Load a sasview model given the model name.
     """
     modelname = modelname+"Model"
+    modelname = modelname
     sans = __import__('sans.models.'+modelname)
     ModelClass = getattr(getattr(sans.models,modelname,None),modelname,None)
 …
     sasmodels = __import__('sasmodels.models.'+modelname)
     module = getattr(sasmodels.models, modelname, None)
     kernel = opencl_model(module, dtype=dtype)
+    kernel = gpu.load_model(module, dtype=dtype)
     return kernel
 …
     sasmodels = __import__('sasmodels.models.'+modelname)
     module = getattr(sasmodels.models, modelname, None)
     kernel = dll_model(module, dtype=dtype)
+    kernel = dll.load_model(module, dtype=dtype)
     return kernel
+def compare(Ncpu, cpuname, cpupars, Ngpu, gpuname, gpupars):
+def randomize(p, v):
+    """
+    Return a random value for parameter *p*, or *v* if *p* is a
+    polydispersity control that should not be randomized.
+
+    Parameters are identified by name only: names containing theta, phi
+    or psi are treated as angles and names containing sld as scattering
+    length densities.  This is a guess based on the naming convention.
+    """
+    # Leave the polydispersity controls alone.  The rest of this file spells
+    # the width parameter "_pd_nsigma"; "_pd_nsigmas" is kept so that any
+    # parameter set using the old spelling still passes through unchanged.
+    if p.endswith(('_pd_n', '_pd_nsigma', '_pd_nsigmas', '_pd_type')):
+        return v
+    if any(s in p for s in ('theta','phi','psi')):
+        # integer angle in [0, 90)
+        return np.random.randint(0,90)
+    elif any(s in p for s in ('sld','Sld','SLD')):
+        return np.random.rand()*1e-5
+    else:
+        return np.random.rand()
+def parlist(pars):
+    """
+    Format *pars* as one "name: value" line per parameter, sorted by name.
+    """
+    lines = ["%s: %s"%item for item in sorted(pars.items())]
+    return "\n".join(lines)
+def suppress_pd(pars):
+    """
+    Turn off polydispersity by setting every parameter whose name ends
+    in "_pd" to zero.  *pars* is modified in place; nothing is returned.
+
+    Used to skip theta_pd until its normalization is resolved, and to
+    test models more quickly without polydispersity.
+    """
+    pd_names = [name for name in pars if name.endswith("_pd")]
+    for name in pd_names:
+        pars[name] = 0
+def compare(gpuname, gpupars, Ncpu, Ngpu, opts):
     #from sasmodels.core import load_data
     #data = load_data('December/DEC07098.DAT')
+    from sasmodels.core import empty_data1D
+    data = empty_data1D(np.logspace(-4, -1, 128))
+    #from sasmodels.core import empty_2D, set_beam_stop
+    #data = empty_data2D(np.linspace(-0.05, 0.05, 128))
+    #set_beam_stop(data, 0.004)
+    qmax = 1.0 if '-highq' in opts else (0.2 if '-midq' in opts else 0.05)
+    if "-1d" in opts:
+        from sasmodels.bumps_model import empty_data1D
+        qmax = np.log10(qmax)
+        data = empty_data1D(np.logspace(qmax-3, qmax, 128))
+    else:
+        from sasmodels.bumps_model import empty_data2D, set_beam_stop
+        data = empty_data2D(np.linspace(-qmax, qmax, 128))
+        set_beam_stop(data, 0.004)
     is2D = hasattr(data, 'qx_data')
+    dtype = 'double' if '-double' in opts else 'single'
+    cutoff_opts = [s for s in opts if s.startswith('-cutoff')]
+    cutoff = float(cutoff_opts[0].split('=')[1]) if cutoff_opts else 1e-5
+    if '-random' in opts:
+        gpupars = dict((p,randomize(p,v)) for p,v in gpupars.items())
+    if '-pars' in opts: print "pars",parlist(gpupars)
+    if '-mono' in opts: suppress_pd(gpupars)
+    cpuname, cpupars = revert_model(gpuname, gpupars)
+    try:
+        gpumodel = load_opencl(gpuname, dtype=dtype)
+    except Exception,exc:
+        print exc
+        print "... trying again with single precision"
+        gpumodel = load_opencl(gpuname, dtype='single')
+    model = BumpsModel(data, gpumodel, cutoff=cutoff, **gpupars)
     if Ngpu > 0:
-        gpumodel = load_opencl(gpuname, dtype='single')
-        model = BumpsModel(data, gpumodel, **gpupars)
         toc = tic()
         for i in range(Ngpu):
 …
             gpu = model.theory()
         gpu_time = toc()*1000./Ngpu
         print "ocl t=%.1f ms, intensity=%.0f"%(gpu_time, sum(gpu[~np.isnan(gpu)]))
+        print "ocl t=%.1f ms, intensity=%f"%(gpu_time, sum(gpu[~np.isnan(gpu)]))
         #print max(gpu), min(gpu)
+    if 0 and Ncpu > 0: # Hack to compare ctypes vs. opencl
+        dllmodel = load_dll(gpuname, dtype='double')
+        model = BumpsModel(data, dllmodel, **gpupars)
+    comp = None
+    if Ncpu > 0 and "-dll" in opts:
+        dllmodel = load_dll(gpuname, dtype=dtype)
+        model = BumpsModel(data, dllmodel, cutoff=cutoff, **gpupars)
         toc = tic()
         for i in range(Ncpu):
 …
             cpu = model.theory()
         cpu_time = toc()*1000./Ncpu
         print "dll t=%.1f ms"%cpu_time
+        comp = "dll"
     elif 0: # Hack to check new vs old for GpuCylinder
         from Models.code_cylinder_f import GpuCylinder as oldgpu
         from sasmodel import SasModel
         oldmodel = SasModel(data, oldgpu, dtype='single', **cpupars)
+        oldmodel = SasModel(data, oldgpu, dtype=dtype, **cpupars)
         toc = tic()
         for i in range(Ngpu):
 …
             cpu = oldmodel.theory()
         cpu_time = toc()*1000./Ngpu
         print "old t=%.1f ms"%cpu_time
+        comp = "old"
     elif Ncpu > 0:
 …
                 cpu = cpumodel.evalDistribution(data.x)
         cpu_time = toc()*1000./Ncpu
+        print "sasview t=%.1f ms, intensity=%.0f"%(cpu_time, sum(cpu[model.index]))
+        comp = 'sasview'
+        #print "sasview t=%.1f ms, intensity=%.0f"%(cpu_time, sum(cpu[model.index]))
+    if comp:
+        print "%s t=%.1f ms, intensity=%f"%(comp, cpu_time, sum(cpu[model.index]))
     if Ngpu > 0 and Ncpu > 0:
+        print "gpu/cpu", max(abs(gpu/cpu)), "%.15g"%max(abs(gpu)), "%.15g"%max(abs(cpu))
+        #print "speedup %.2g"%(cpu_time/gpu_time)
+        #print "max |gpu/cpu|", max(abs(gpu/cpu)), "%.15g"%max(abs(gpu)), "%.15g"%max(abs(cpu))
         #cpu *= max(gpu/cpu)
+        abserr = (gpu - cpu)
+        relerr = (gpu - cpu)/cpu
+        print "max(|ocl-omp|)", max(abs(abserr[model.index]))
+        print "max(|(ocl-omp)/ocl|)", max(abs(relerr[model.index]))
+    #return
+        resid, relerr = np.zeros_like(gpu), np.zeros_like(gpu)
+        resid[model.index] = (gpu - cpu)[model.index]
+        relerr[model.index] = resid[model.index]/cpu[model.index]
+        print "max(|ocl-%s|)"%comp, max(abs(resid[model.index]))
+        print "max(|(ocl-%s)/ocl|)"%comp, max(abs(relerr[model.index]))
+    if '-noplot' in opts: return
     import matplotlib.pyplot as plt
 …
         if Ngpu > 0: plt.subplot(131)
         plot_data(data, cpu, scale='log')
         plt.title("omp t=%.1f ms"%cpu_time)
+        plt.title("%s t=%.1f ms"%(comp,cpu_time))
     if Ngpu > 0:
         if Ncpu > 0: plt.subplot(132)
 …
     if Ncpu > 0 and Ngpu > 0:
         plt.subplot(133)
+        plot_data(data, 1e8*relerr, scale='linear')
+        plt.title("max rel err = %.3g"%max(abs(relerr)))
+        err = resid if '-abs' in opts else relerr
+        plot_data(data, err, scale='linear')
+        plt.title("max rel err = %.3g"%max(abs(err[model.index])))
         if is2D: plt.colorbar()
     plt.show()
-def rename(pars, **names):
-    newpars = pars.copy()
-    for new,old in names.items():
-        for variant in ("", "_pd", "_pd_n", "_pd_nsigma"):
-            if old+variant in newpars:
-                newpars[new+variant] = pars[old+variant]
-                del newpars[old+variant]
-    return newpars
-def rescale_sld(pars, names):
-    newpars = pars.copy()
-    for p in names:
-        newpars[p] *= 1e6
-    return newpars
 # ===========================================================================
+#
+# Command line help.  The single %s is filled in with the list of models.
+# Each option line lists the alternatives in the same order as they are
+# described, with * marking the behaviour used when no option is given.
+USAGE="""
+usage: compare.py model [Nopencl] [Nsasview] [options...] [key=val]
+Compare the speed and value for a model between the SasView original and the
+OpenCL rewrite.
+model is the name of the model to compare (see below).
+Nopencl is the number of times to run the OpenCL model (default=5)
+Nsasview is the number of times to run the Sasview model (default=1)
+Options (* for default):
+    -plot*/-noplot plot or suppress the plot of the model
+    -single*/-double use single or double precision for comparison
+    -lowq*/-midq/-highq use q values up to 0.05, 0.2 or 1.0
+    -2d*/-1d use 2d or 1d data
+    -preset*/-random use preset or randomized parameters
+    -poly*/-mono keep polydispersity or force monodisperse
+    -sasview*/-dll whether cpu is tested using sasview or dll
+    -cutoff=1e-5*/value cutoff for including a point in polydispersity
+    -nopars*/-pars suppress or print the parameter set
+    -rel*/-abs plot relative or absolute error
+Key=value pairs allow you to set specific values to any of the model
+parameters.
+Available models:
+    %s
+"""
+def main():
+    """
+    Parse the command line and run the comparison.
+
+    Arguments starting with '-' are collected as options; the remaining
+    arguments are, in order, the model name, the number of OpenCL runs,
+    the number of SasView runs, and any key=value parameter overrides.
+    Prints the usage message and exits with status 1 if no model is
+    given, the model is unknown, or a key is not a model parameter.
+    """
+    opts = [arg for arg in sys.argv[1:] if arg.startswith('-')]
+    args = [arg for arg in sys.argv[1:] if not arg.startswith('-')]
+    models = "\n    ".join("%-7s: %s"%(k,v.__name__.replace('_',' '))
+                           for k,v in sorted(MODELS.items()))
+    if len(args) == 0:
+        print(USAGE%models)
+        sys.exit(1)
+    if args[0] not in MODELS:
+        print "Model %r not available. Use one of:\n    %s"%(args[0],models)
+        sys.exit(1)
+    name, pars = MODELS[args[0]]()
+    Nopencl = int(args[1]) if len(args) > 1 else 5
+    # args[2] is present as soon as there are three positional arguments
+    Nsasview = int(args[2]) if len(args) > 2 else 1
+    # Fill in default polydispersity parameters
+    pds = set(p.split('_pd')[0] for p in pars if p.endswith('_pd'))
+    for p in pds:
+        if p+"_pd_nsigma" not in pars: pars[p+"_pd_nsigma"] = 3
+        if p+"_pd_type" not in pars: pars[p+"_pd_type"] = "gaussian"
+    # Fill in parameters given on the command line
+    for arg in args[3:]:
+        # split on the first '=' only so the value may itself contain '='
+        k,v = arg.split('=', 1)
+        if k not in pars:
+            # extract base name without distribution
+            # style may be either a.d or a_pd_d
+            s = set((p.split('_pd')[0]).split('.')[0] for p in pars)
+            print "%r invalid; parameters are: %s"%(k,", ".join(sorted(s)))
+            sys.exit(1)
+        # distribution type parameters (e.g. radius_pd_type) hold a name,
+        # not a number; the parameter name decides, not the value
+        pars[k] = float(v) if not k.endswith('type') else v
+    compare(name, pars, Nsasview, Nopencl, opts)
+# ===========================================================================
+#
 MODELS = {}
 def model(name):
 …
     return gather_function
-USAGE="""
-usage: compare model [Nopencl] [Nsasview]
-Compare the speed and value for a model between the SasView original and the
-OpenCL rewrite.
-* Nopencl is the number of times to run the OpenCL model (default=5)
-* Nsasview is the number of times to run the Sasview model (default=1)
-* model is the name of the model to compare:
-    %s
-"""
-def main():
-    if len(sys.argv) == 1:
-        models = "\n    ".join("%-7s: %s"%(k,v.__name__.replace('_',' '))
-                               for k,v in sorted(MODELS.items()))
-        print(USAGE%models)
-        sys.exit(1)
-    cpuname, cpupars, gpuname, gpupars = MODELS[sys.argv[1]]()
-    Nopencl = int(sys.argv[2]) if len(sys.argv) > 2 else 5
-    Nsasview = int(sys.argv[3]) if len(sys.argv) > 3 else 1
-    compare(Nsasview, cpuname, cpupars, Nopencl, gpuname, gpupars)
 @model('cyl')
 def cylinder():
+    cpupars = dict(
+        scale=.003, background=.1,
+        sldCyl=.291e-6, sldSolv=5.77e-6,
+        radius=264.1, length=66.96,
+        cyl_theta=85, cyl_phi=0,
+        radius_pd=0.1, radius_pd_n=10, radius_pd_nsigma=3,
+        length_pd=0.1,length_pd_n=1, length_pd_nsigma=3,
+        cyl_theta_pd=45, cyl_theta_pd_n=50, cyl_theta_pd_nsigma=3,
+        cyl_phi_pd=0.1, cyl_phi_pd_n=5, cyl_phi_pd_nsigma=3,
+        )
+    cpuname = 'Cylinder'
+    gpupars = rename(cpupars, theta='cyl_theta', phi='cyl_phi', sld='sldCyl', solvent_sld='sldSolv')
+    gpupars = rescale_sld(gpupars, ['sld', 'solvent_sld'])
+    gpuname = 'cylinder'
+    return cpuname, cpupars, gpuname, gpupars
+    pars = dict(
+        scale=1, background=0,
+        sld=6e-6, solvent_sld=1e-6,
+        #radius=5, length=20,
+        radius=260, length=290,
+        theta=30, phi=15,
+        radius_pd=.2, radius_pd_n=1,
+        length_pd=.2,length_pd_n=1,
+        theta_pd=15, theta_pd_n=25,
+        phi_pd=15, phi_pd_n=1,
+        )
+    return 'cylinder', pars
+@model('capcyl')
+def capped_cylinder():
+    pars = dict(
+        scale=1, background=0,
+        sld=6e-6, solvent_sld=1e-6,
+        radius=260, cap_radius=80000, length=290,
+        theta=30, phi=15,
+        radius_pd=.2, radius_pd_n=1,
+        cap_radius_pd=.2, cap_radius_pd_n=1,
+        length_pd=.2, length_pd_n=1,
+        theta_pd=15, theta_pd_n=25,
+        phi_pd=15, phi_pd_n=1,
+        )
+    return 'capped_cylinder', pars
+@model('cscyl')
+def core_shell_cylinder():
+    pars = dict(
+        scale=1, background=0,
+        core_sld=6e-6, shell_sld=8e-6, solvent_sld=1e-6,
+        radius=325, thickness=25, length=34.2709,
+        theta=90, phi=0,
+        radius_pd=0.1, radius_pd_n=10,
+        length_pd=0.1, length_pd_n=5,
+        thickness_pd=0.1, thickness_pd_n=5,
+        theta_pd=15.8, theta_pd_n=5,
+        phi_pd=0.0008748, phi_pd_n=5,
+        )
+    return 'core_shell_cylinder', pars
 @model('ell')
+def ellipse():
+    pars = dict(
+        scale=.027, background=4.9,
+        sldEll=.297e-6, sldSolv=5.773e-6,
+        radius_a=60, radius_b=180,
+        axis_theta=0, axis_phi=90,
+        radius_a_pd=0.1, radius_a_pd_n=10, radius_a_pd_nsigma=3,
+        radius_b_pd=0.1, radius_b_pd_n=10, radius_b_pd_nsigma=3,
+        axis_theta_pd=0.1, axis_theta_pd_n=6, axis_theta_pd_nsigma=3,
+        axis_phi_pd=0.1, axis_phi_pd_n=6, axis_phi_pd_nsigma=3,
+        )
+    from Models.code_ellipse import GpuEllipse as gpumodel
+    model = sasview_model('Ellipsoid', **pars)
+    pars = rename(pars, theta='axis_theta', phi='axis_phi', sld='sldEll', solvent_sld='sldSolv')
+    pars = rescale_sld(pars, ['sld', 'solvent_sld'])
+    return model, gpumodel, pars
+@model('cscyl')
+def core_shell_cylinder(N=1):
+    pars = dict(
+        scale= 1.77881e-06, background=223.827,
+        core_sld=1e-6, shell_sld=.291e-6, solvent_sld=7.105e-6,
+        radius=325, thickness=25, length=34.2709,
+        axis_theta=90, axis_phi=0,
+        radius_pd=0.1, radius_pd_n=10, radius_pd_nsigma=3,
+        length_pd=0.1, length_pd_n=10, length_pd_nsigma=3,
+        thickness_pd=0.1, thickness_pd_n=5, thickness_pd_nsigma=3,
+        axis_theta_pd=15.8, axis_theta_pd_n=20, axis_theta_pd_nsigma=5,
+        axis_phi_pd=0.0008748, axis_phi_pd_n=5, axis_phi_pd_nsigma=3,
+        )
+    model = sasview_model('CoreShellCylinder', **pars)
+    from Models.code_coreshellcyl_f import GpuCoreShellCylinder as gpumodel
+    pars = rename(pars, theta='axis_theta', phi='axis_phi')
+    pars = rescale_sld(pars, ['core_sld', 'shell_sld', 'solvent_sld'])
+    return model, gpumodel, pars
+def ellipsoid():
+    pars = dict(
+        scale=1, background=0,
+        sld=6e-6, solvent_sld=1e-6,
+        rpolar=50, requatorial=30,
+        theta=0, phi=0,
+        rpolar_pd=0.3, rpolar_pd_n=10,
+        requatorial_pd=0, requatorial_pd_n=10,
+        theta_pd=0, theta_pd_n=45,
+        phi_pd=0, phi_pd_n=45,
+        )
+    return 'ellipsoid', pars
 @model('ell3')
+def triaxial_ellipse(N=1):
+    pars = dict(
+        scale=0.08, background=5,
+        sldEll=7.105e-6, sldSolv=.291e-6,
+        axis_theta=0, axis_phi=0, axis_psi=0,
+        semi_axisA=15, semi_axisB=20, semi_axisC=500,
+        axis_theta_pd=20, axis_theta_pd_n=10, axis_theta_pd_nsigma=3,
+        axis_phi_pd=.1, axis_phi_pd_n=10, axis_phi_pd_nsigma=3,
+        axis_psi_pd=30, axis_psi_pd_n=5, axis_psi_pd_nsigma=3,
+        semi_axisA_pd=.1, semi_axisA_pd_n=5, semi_axisA_pd_nsigma=3,
+        semi_axisB_pd=.1, semi_axisB_pd_n=5, semi_axisB_pd_nsigma=3,
+        semi_axisC_pd=.1, semi_axisC_pd_n=5, semi_axisC_pd_nsigma=3,
+        )
+    model = sasview_model('TriaxialEllipsoid', **pars)
+    from Models.code_triaxialellipse import GpuTriEllipse as gpumodel
+    pars = rename(pars,
+                  theta='axis_theta', phi='axis_phi', psi='axis_psi',
+                  sld='sldEll', solvent_sld='sldSolv',
+                  radius_a='semi_axisA', radius_b='semi_axisB',
+                  radius_c='semi_axisC',
+                  )
+    pars = rescale_sld(pars, ['sld', 'solvent_sld'])
+    return model, gpumodel, pars
+def triaxial_ellipsoid():
+    pars = dict(
+        scale=1, background=0,
+        sld=6e-6, solvent_sld=1e-6,
+        theta=0, phi=0, psi=0,
+        req_minor=25, req_major=36, rpolar=50,
+        theta_pd=0, theta_pd_n=5,
+        phi_pd=0, phi_pd_n=5,
+        psi_pd=0, psi_pd_n=5,
+        req_minor_pd=0, req_minor_pd_n=5,
+        req_major_pd=0, req_major_pd_n=5,
+        rpolar_pd=.3, rpolar_pd_n=25,
+        )
+    return 'triaxial_ellipsoid', pars
+@model('sph')
+def sphere():
+    pars = dict(
+        scale=1, background=0,
+        sld=6e-6, solvent_sld=1e-6,
+        radius=120,
+        radius_pd=.3, radius_pd_n=5,
+        )
+    return 'sphere', pars
 @model('lam')
+def lamellar(N=1):
+    pars = dict(
+        scale=0.08, background=0.003,
+        sld_bi=5.38e-6,sld_sol=7.105e-6,
+        bi_thick=19.2946,
+        bi_thick_pd= 0.37765, bi_thick_pd_n=40, bi_thick_pd_nsigma=3,
+        )
+    model = sasview_model('Lamellar', **pars)
+    from Models.code_lamellar import GpuLamellar as gpumodel
+    pars = rename(pars, sld='sld_bi', solvent_sld='sld_sol', thickness='bi_thick')
+    pars = rescale_sld(pars, ['sld', 'solvent_sld'])
+    return model, gpumodel, pars
+@model('capcyl')
+def capped_cylinder(N=1):
+    pars = dict(
+        scale=.08, background=0,
+        sld_capcyl=1e-6, sld_solv=6.3e-6,
+        rad_cyl=20, rad_cap=40, len_cyl=400,
+        theta=0, phi=0,
+        rad_cyl_pd=.1, rad_cyl_pd_n=10, rad_cyl_pd_nsigma=3,
+        rad_cap_pd=.1, rad_cap_pd_n=10, rad_cap_pd_nsigma=3,
+        len_cyl_pd=.1, len_cyl_pd_n=3, len_cyl_pd_nsigma=3,
+        theta_pd=.1, theta_pd_n=3, theta_pd_nsigma=3,
+        phi_pd=.1, phi_pd_n=3, phi_pd_nsigma=3,
+        )
+    model = sasview_model('CappedCylinder', **pars)
+    from Models.code_capcyl import GpuCapCylinder as gpumodel
+    pars = rename(pars,
+                  sld='sld_capcyl', solvent_sld='sld_solv',
+                  length='len_cyl', radius='rad_cyl',
+                  cap_radius='rad_cap')
+    pars = rescale_sld(pars, ['sld', 'solvent_sld'])
+    return model, gpumodel, pars
+def lamellar():
+    pars = dict(
+        scale=1, background=0,
+        sld=6e-6, solvent_sld=1e-6,
+        thickness=40,
+        thickness_pd= 0.3, thickness_pd_n=40,
+        )
+    return 'lamellar', pars
 if __name__ == "__main__":

sasmodels/bumps_model.py

-                      rff7119b
+                      r5d4777d
     import matplotlib.pyplot as plt
     if hasattr(data, 'qx_data'):
+        img = masked_array(iq, data.mask)
+        iq = iq[:]
+        valid = np.isfinite(iq)
         if scale == 'log':
+            img[(img <= 0) | ~np.isfinite(img)] = masked
+            img = np.log10(img)
+            valid[valid] = (iq[valid] > 0)
+            iq[valid] = np.log10(iq[valid])
+        iq[~valid|data.mask] = 0
+        #plottable = iq
+        plottable = masked_array(iq, ~valid|data.mask)
         xmin, xmax = min(data.qx_data), max(data.qx_data)
         ymin, ymax = min(data.qy_data), max(data.qy_data)
         plt.imshow(img.reshape(128,128),
+        plt.imshow(plottable.reshape(128,128),
                    interpolation='nearest', aspect=1, origin='upper',
                    extent=[xmin, xmax, ymin, ymax], vmin=vmin, vmax=vmax)
 …
             plt.plot(data.x[idx], iq[idx])
         else:
+            idx = np.isfinite(iq) & (iq>0)
+            idx = np.isfinite(iq)
+            idx[idx] = (iq[idx]>0)
             plt.loglog(data.x[idx], iq[idx])
 …
     def __init__(self, data, model, cutoff=1e-5, **kw):
         from bumps.names import Parameter
+        partype = model.info['partype']
         # interpret data
 …
             self.diq = data.err_data[self.index]
             self._theory = np.zeros_like(data.data)
+            q_vectors = [data.qx_data, data.qy_data]
+            if not partype['orientation'] and not partype['magnetic']:
+                q_vectors = [np.sqrt(data.qx_data**2+data.qy_data**2)]
+            else:
+                q_vectors = [data.qx_data, data.qy_data]
         else:
             self.index = (data.x>=data.qmin) & (data.x<=data.qmax) & ~np.isnan(data.y)
 …
             setattr(self, name, Parameter.default(value, name=name, limits=limits))
             pars.append(name)
         for name in model.info['partype']['pd-2d']:
+        for name in partype['pd-2d']:
             for xpart,xdefault,xlimits in [
                     ('_pd', 0, limits),

sasmodels/dll.py

-                      rff7119b
+                      r5d4777d
 C types wrapper for sasview models.
 """
+import sys
+import os
 import ctypes as ct
 from ctypes import c_void_p, c_int, c_double
 …
 from .gen import F32, F64
+# Compiler platform details
+if sys.platform == 'darwin':
+    COMPILE = "gcc-mp-4.7 -shared -fPIC -std=c99 -fopenmp -O2 -Wall %s -o %s -lm -lgomp"
+elif os.name == 'nt':
+    COMPILE = "gcc -shared -fPIC -std=c99 -fopenmp -O2 -Wall %s -o %s -lm"
+else:
+    COMPILE = "cc -shared -fPIC -std=c99 -fopenmp -O2 -Wall %s -o %s -lm"
+DLL_PATH = "/tmp"
+def dll_path(info):
+    """
+    Return the location of the shared library for the model described
+    by *info*: the base name of info['filename'] with its extension
+    replaced by '.so', placed in the DLL_PATH directory.
+    """
+    import os.path
+    source_file = os.path.basename(info['filename'])
+    stem, _ext = os.path.splitext(source_file)
+    return os.path.join(DLL_PATH, stem+'.so')
+def load_model(kernel_module, dtype=None):
+    """
+    Load the compiled model defined by *kernel_module*.
+    Recompile if any files are newer than the model file.
+    *dtype* is ignored.  Compiled files are always double.
+    The DLL is not loaded until the kernel is called so models can
+    be defined without using too many resources.
+    """
+    import tempfile
+    source, info = gen.make(kernel_module)
+    source_files = gen.sources(info) + [info['filename']]
+    newest = max(os.path.getmtime(f) for f in source_files)
+    dllpath = dll_path(info)
+    if not os.path.exists(dllpath) or os.path.getmtime(dllpath)<newest:
+        # Write the generated C source to a temporary file.  Close it
+        # explicitly so the contents are flushed to disk before the
+        # compiler is started.
+        fid, filename = tempfile.mkstemp(suffix=".c",prefix="sas_"+info['name'])
+        with os.fdopen(fid,"w") as fd:
+            fd.write(source)
+        status = os.system(COMPILE%(filename, dllpath))
+        if status != 0:
+            print "compile failed.  File is in %r"%filename
+        else:
+            ## The generated c file is left in place after a successful
+            ## compile; uncomment the following to remove it instead.
+            #os.unlink(filename)
+            pass
+    return DllModel(dllpath, info)
 IQ_ARGS = [c_void_p, c_void_p, c_int, c_void_p, c_double]
 …
     """
     def __init__(self, kernel, info, input):
+        self.info = info
         self.input = input
         self.kernel = kernel

sasmodels/gen.py

-                      rff7119b
+                      r5d4777d
 *Iq*, *Iqxy*, *Imagnetic* and *form_volume* should be stylized C-99
+functions written for OpenCL.  Floating point values should be
+declared as *real*.  Depending on how the function is called, a macro
+will replace *real* with *float* or *double*.  Unfortunately, MacOSX
+is picky about floating point constants, which should be defined with
+value + 'f' if they are of type *float* or just a bare value if they
+are of type *double*.  The solution is a macro *REAL(value)* which
+adds the 'f' if compiling for single precision floating point.  This
+does make the code ugly, and may someday be replaced by a clever
+regular expression which does the same job.  OpenCL has a *sincos*
+function which can improve performance when both the *sin* and *cos*
+values are needed for a particular argument.  Since this function
+does not exist in C-99, all use of *sincos* should be replaced by the
+macro *SINCOS(value,sn,cn)* where *sn* and *cn* are previously declared
+*real* values.  *value* may be an expression.  When compiled for systems
+without OpenCL, *SINCOS* will be replaced by *sin* and *cos* calls.  All
+functions need prototype declarations even if they are defined before they
+are used -- another present from MacOSX.  OpenCL does not support
+*#include* preprocessor directives; instead the includes must be listed
+in the kernel metadata, with functions defined before they are used.
+The included files should be listed using relative path to the kernel
+source file, or if using one of the standard models, relative to the
+sasmodels source files.
+functions written for OpenCL.  All functions need prototype declarations
+even if they are defined before they are used.  OpenCL does not support
+*#include* preprocessor directives, so instead the list of includes needs
+to be given as part of the metadata in the kernel module definition.
+The included files should be listed using a path relative to the kernel
+module, or as "lib/file.c" if it is one of the standard includes
+provided with the sasmodels source.  The includes need to be listed in
+order so that functions are defined before they are used.
+Floating point values should be declared as *real*.  Depending on how the
+function is called, a macro will replace *real* with *float* or *double*.
+Unfortunately, MacOSX is picky about floating point constants, which
+should be defined with value + 'f' if they are of type *float* or just
+a bare value if they are of type *double*.  The solution is a macro
+*REAL(value)* which adds the 'f' if compiling for single precision
+floating point.  [Note: we could write a clever regular expression
+which automatically detects real-valued constants.  If we wanted to
+make our code more C-like, we could define variables with double but
+replace them with float before compiling for single precision.]
+OpenCL has a *sincos* function which can improve performance when both
+the *sin* and *cos* values are needed for a particular argument.  Since
+this function does not exist in C99, all use of *sincos* should be
+replaced by the macro *SINCOS(value,sn,cn)* where *sn* and *cn* are
+previously declared *real* values.  *value* may be an expression.  When
+compiled for systems without OpenCL, *SINCOS* will be replaced by
+*sin* and *cos* calls.
+If the input parameters are invalid, the scattering calculator should
+return a negative number. Particularly with polydispersity, there are
+some sets of shape parameters which lead to nonsensical forms, such
+as a capped cylinder where the cap radius is smaller than the
+cylinder radius.  The polydispersity calculation will ignore these points,
+effectively chopping the parameter weight distributions at the boundary
+of the infeasible region.  The resulting scattering will be set to
+background.  This will work correctly even when polydispersity is off.
 *ER* and *VR* are python functions which operate on parameter vectors.
 …
     *VR* is a python function defining the volume ratio.  If it is not
     present, the volume ratio is 1.
+    *form_volume*, *Iq*, *Iqxy*, *Imagnetic* are strings containing the
+    C source code for the body of the volume, Iq, and Iqxy functions
+    respectively.  These can also be defined in the last source file.
 An *info* dictionary is constructed from the kernel meta data and
 …
 __all__ = ["make", "doc", "sources"]
+import sys
+import os
 import os.path
 …
 #endif
 // Standard mathematical constants, prefixed with M_:
 //   E, LOG2E, LOG10E, LN2, LN10, PI, PI_2, PI_4, 1_PI, 2_PI,
 //   2_SQRTPI, SQRT2, SQRT1_2
+// Standard mathematical constants:
+//   M_E, M_LOG2E, M_LOG10E, M_LN2, M_LN10, M_PI, M_PI_2=pi/2, M_PI_4=pi/4,
+//   M_1_PI=1/pi, M_2_PI=2/pi, M_2_SQRTPI=2/sqrt(pi), SQRT2, SQRT1_2=sqrt(1/2)
 // OpenCL defines M_constant_F for float constants, and nothing if double
 // is not enabled on the card, which is why these constants may be missing
 …
     'qinit': "const real qi = q[i];",
     'qcall': "qi",
+    'qwork': ["q"],
+    }
 …
     'qinit': "const real qxi = qx[i];\n    const real qyi = qy[i];",
     'qcall': "qxi, qyi",
+    'qwork': ["qx", "qy"],
+    }
 …
 for (int %(name)s_i=0; %(name)s_i < N%(name)s; %(name)s_i++) {
   const real %(name)s = loops[2*(%(name)s_i%(offset)s)];
+  const real %(name)s_w = loops[2*(%(name)s_i%(offset)s)+1];"""
+  const real %(name)s_w = loops[2*(%(name)s_i%(offset)s)+1];\
+"""
 # Polydispersity loop body.
 …
 const real weight = %(weight_product)s;
 if (weight > cutoff) {
+  ret += weight*%(fn)s(%(qcall)s, %(pcall)s);
+  norm += weight;
+  %(volume_norm)s
+}"""
+  const real I = %(fn)s(%(qcall)s, %(pcall)s);
+  if (I>=REAL(0.0)) { // scattering cannot be negative
+    ret += weight*I;
+    norm += weight;
+    %(volume_norm)s
+  }
+  //else { printf("exclude qx,qy,I:%%g,%%g,%%g\\n",%(qcall)s,I); }
+}
+//else { printf("exclude weight:%%g\\n",weight); }\
+"""
+# Use this when integrating over orientation
+SPHERICAL_CORRECTION="""\
+// Correction factor for spherical integration p(theta) I(q) sin(theta) dtheta
+real spherical_correction = (Ntheta>1 ? fabs(cos(M_PI_180*phi)) : REAL(1.0));\
+"""
 # Volume normalization.
 …
 # a normalized weight.
 VOLUME_NORM="""const real vol_weight = %(weight)s;
+  vol += vol_weight*form_volume(%(pars)s);
+  norm_vol += vol_weight;"""
+    vol += vol_weight*form_volume(%(pars)s);
+    norm_vol += vol_weight;\
+"""
+# functions defined as strings in the .py module
+WORK_FUNCTION="""\
+real %(name)s(%(pars)s);
+real %(name)s(%(pars)s)
+{
+%(body)s
+}\
+"""
 # Documentation header for the module, giving the model name, its short
 …
     vol_pars = info['partype']['volume']
     q_pars = KERNEL_2D if is_2D else KERNEL_1D
+    fn = q_pars['fn']
     # Build polydispersity loops
 …
     fq_pars = [p[0] for p in info['parameters'][len(COMMON_PARAMETERS):]
                if p[0] in set(fixed_pars+pd_pars)]
+    if False and "phi" in pd_pars:
+        spherical_correction = [indent(SPHERICAL_CORRECTION, depth)]
+        weights = [p+"_w" for p in pd_pars]+['spherical_correction']
+    else:
+        spherical_correction = []
+        weights = [p+"_w" for p in pd_pars]
     subst = {
         'weight_product': "*".join(p+"_w" for p in pd_pars),
+        'weight_product': "*".join(weights),
         'volume_norm': volume_norm,
         'fn': q_pars['fn'],
+        'fn': fn,
         'qcall': q_pars['qcall'],
         'pcall': ", ".join(fq_pars), # skip scale and background
+        }
     loop_body = [indent(LOOP_BODY%subst, depth)]
     loops = "\n".join(loop_head+loop_body+loop_end)
+    loops = "\n".join(loop_head+spherical_correction+loop_body+loop_end)
     # declarations for non-pd followed by pd pars
 …
+        }
     kernel = KERNEL_TEMPLATE%subst
+    # If the working function is defined in the kernel metadata as a
+    # string, translate the string to an actual function definition
+    # and put it before the kernel.
+    if info[fn]:
+        subst = {
+            'name': fn,
+            'pars': ", ".join("real "+p for p in q_pars['qwork']+fq_pars),
+            'body': info[fn],
+            }
+        kernel = "\n".join((WORK_FUNCTION%subst, kernel))
     return kernel
 …
     search_path = [ dirname(info['filename']),
                     abspath(joinpath(dirname(__file__),'models')) ]
     return [_search(search_path) for f in info['source']]
+    return [_search(search_path, f) for f in info['source']]
 def make_model(info):
 …
     found in the given search path.
     """
+    source = [open(f).read() for f in sources(info)]
+    # If the form volume is defined as a string, then wrap it in a
+    # function definition and place it after the external sources but
+    # before the kernel functions.  If the kernel functions are strings,
+    # they will be translated in the make_kernel call.
+    if info['form_volume']:
+        subst = {
+            'name': "form_volume",
+            'pars': ", ".join("real "+p for p in info['partype']['volume']),
+            'body': info['form_volume'],
+            }
+        source.append(WORK_FUNCTION%subst)
     kernel_Iq = make_kernel(info, is_2D=False)
     kernel_Iqxy = make_kernel(info, is_2D=True)
-    source = [open(f).read() for f in sources(info)]
     kernel = "\n\n".join([KERNEL_HEADER]+source+[kernel_Iq, kernel_Iqxy])
     return kernel
 …
         name = kernel_module.name,
         title = kernel_module.title,
-        source = kernel_module.source,
         description = kernel_module.description,
         parameters = COMMON_PARAMETERS + kernel_module.parameters,
+        ER = getattr(kernel_module, 'ER', None),
+        VR = getattr(kernel_module, 'VR', None),
+        source = getattr(kernel_module, 'source', []),
+        )
+    # Fill in attributes which default to None
+    info.update((k,getattr(kernel_module, k, None))
+                for k in ('ER', 'VR', 'form_volume', 'Iq', 'Iqxy'))
+    # Fill in the derived attributes
     info['limits'] = dict((p[0],p[3]) for p in info['parameters'])
     info['partype'] = categorize_parameters(info['parameters'])
 …
     return DOC_HEADER%subst
-# Compiler platform details
-if sys.platform == 'darwin':
-    COMPILE = "gcc-mp-4.7 -shared -fPIC -std=c99 -fopenmp -O2 -Wall %s -o %s -lm -lgomp"
-elif os.name == 'nt':
-    COMPILE = "gcc -shared -fPIC -std=c99 -fopenmp -O2 -Wall %s -o %s -lm"
-else:
-    COMPILE = "cc -shared -fPIC -std=c99 -fopenmp -O2 -Wall %s -o %s -lm"
-DLL_PATH = "/tmp"
-def dll_path(info):
-    """
-    Path to the compiled model defined by *info*.
-    """
-    from os.path import join as joinpath, split as splitpath, splitext
-    basename = splitext(splitpath(info['filename'])[1])[0]
-    return joinpath(DLL_PATH, basename+'.so')
-def dll_model(kernel_module, dtype=None):
-    """
-    Load the compiled model defined by *kernel_module*.
-    Recompile if any files are newer than the model file.
-    *dtype* is ignored.  Compiled files are always double.
-    The DLL is not loaded until the kernel is called so models can
-    be defined without using too many resources.
-    """
-    import tempfile
-    from sasmodels import dll
-    source, info = make(kernel_module)
-    source_files = sources(info) + [info['filename']]
-    newest = max(os.path.getmtime(f) for f in source_files)
-    dllpath = dll_path(info)
-    if not os.path.exists(dllpath) or os.path.getmtime(dllpath)<newest:
-        # Replace with a proper temp file
-        srcfile = tempfile.mkstemp(suffix=".c",prefix="sas_"+info['name'])
-        open(srcfile, 'w').write(source)
-        os.system(COMPILE%(srcfile, dllpath))
-        ## comment the following to keep the generated c file
-        os.unlink(srcfile)
-    return dll.DllModel(dllpath, info)
-def opencl_model(kernel_module, dtype="single"):
-    """
-    Load the OpenCL model defined by *kernel_module*.
-    Access to the OpenCL device is delayed until the kernel is called
-    so models can be defined without using too many resources.
-    """
-    from sasmodels import gpu
-    source, info = make(kernel_module)
-    ## for debugging, save source to a .cl file, edit it, and reload as model
-    #open(modelname+'.cl','w').write(source)
-    #source = open(modelname+'.cl','r').read()
-    return gpu.GpuModel(source, info, dtype)

sasmodels/gpu.py

-                      rff7119b
+                      r5d4777d
 """
-import warnings
 import numpy as np
 import pyopencl as cl
 …
 from . import gen
-from .gen import F32, F64
 F32_DEFS = """\
 …
 # larger than necessary given that cost grows as npts^k where k is the number
 # of polydisperse parameters.
+MAX_LOOPS = 1024
+MAX_LOOPS = 2048
+def load_model(kernel_module, dtype="single"):
+    """
+    Load the OpenCL model defined by *kernel_module*.
+    Access to the OpenCL device is delayed until the kernel is called
+    so models can be defined without using too many resources.
+    """
+    source, info = gen.make(kernel_module)
+    ## for debugging, save source to a .cl file, edit it, and reload as model
+    open(info['name']+'.cl','w').write(source)
+    #source = open(info['name']+'.cl','r').read()
+    return GpuModel(source, info, dtype)
 ENV = None
 …
     """
     dtype = np.dtype(dtype)
     if dtype==F64 and not all(has_double(d) for d in context.devices):
+    if dtype==gen.F64 and not all(has_double(d) for d in context.devices):
         raise RuntimeError("Double precision not supported for devices")
     header = F64_DEFS if dtype == F64 else F32_DEFS
+    header = F64_DEFS if dtype == gen.F64 else F32_DEFS
     # Note: USE_SINCOS makes the intel cpu slower under opencl
     if context.devices[0].type == cl.device_type.GPU:
 …
     is an optional extension which may not be available on all devices.
     """
     def __init__(self, source, info, dtype=F32):
+    def __init__(self, source, info, dtype=gen.F32):
         self.info = info
         self.source = source
 …
     buffer will be released when the data object is freed.
     """
     def __init__(self, q_vectors, dtype=F32):
+    def __init__(self, q_vectors, dtype=gen.F32):
         env = environment()
         self.nq = q_vectors[0].size
 …
         env = environment()
         self.loops_b = [cl.Buffer(env.context, mf.READ_WRITE,
                                   MAX_LOOPS*input.dtype.itemsize)
+*MAX_LOOPS*input.dtype.itemsize)
                         for _ in env.queues]
         self.res_b = [cl.Buffer(env.context, mf.READ_WRITE,
 …
     def __call__(self, pars, pd_pars, cutoff=1e-5):
         real = np.float32 if self.input.dtype == F32 else np.float64
+        real = np.float32 if self.input.dtype == gen.F32 else np.float64
         fixed = [real(p) for p in pars]
         cutoff = real(cutoff)
         loops = np.hstack(pd_pars)
         loops = np.ascontiguousarray(loops.T, self.input.dtype).flatten()
+        loops_N = [np.uint32(len(p[0])) for p in pd_pars]
+        Nloops = [np.uint32(len(p[0])) for p in pd_pars]
+        #print "loops",Nloops, loops
         #import sys; print >>sys.stderr,"opencl eval",pars
         #print "opencl eval",pars
         if len(loops) > MAX_LOOPS:
+        if len(loops) > 2*MAX_LOOPS:
             raise ValueError("too many polydispersity points")
         device_num = 0
 …
         #ctx = environment().context
         #loops_bi = cl.Buffer(ctx, mf.READ_ONLY | mf.COPY_HOST_PTR, hostbuf=loops)
         args = self.input.q_buffers + [res_bi,loops_bi,loops_l,cutoff] + fixed + loops_N
+        args = self.input.q_buffers + [res_bi,loops_bi,loops_l,cutoff] + fixed + Nloops
         self.kernel(queuei, self.input.global_size, None, *args)
         cl.enqueue_copy(queuei, self.res, res_bi)

sasmodels/models/README.rst

-                      rff7119b
+                      r5d4777d
 model.
+cylindermodel_onefile.py is cylinder.c+cylinder.py merged into one file.
+This doesn't actually run yet since sasmodels.gen has not been updated
+to support it.  It exists as a proposal.  Note that the function declaration
+has been removed since there is enough information in the parameter
+definitions to generate it automatically.  Note also that "source" which
+used to be all the source has been renamed "includes".
+One-file models could coexist with the py+c file models by checking for the
+existence of c_blah and creating the appropriate function wrappers.  These
+would be appended after any include files.  You shouldn't mix the two forms
+within a single model since form_volume needs to be defined before
+Iq/Iqxy but after the libraries.
+lamellar.py is an example of a single file model with embedded C code.
 Note: may want to rename form_volume to calc_volume and Iq/Iqxy to
+calc_Iq/calc_Iqxy in both the c+py and the one file forms so that the
+names are more predictable.  Similarly ER/VR go to calc_ER/calc_VR.
+calc_Iq/calc_Iqxy. Similarly ER/VR go to calc_ER/calc_VR.
 Note: It is possible to translate python code automatically to opencl, using
+something like numba, clyther, shedskin or pypy.
+something like numba, clyther, shedskin or pypy, so maybe the kernel functions
+could be implemented without any C syntax.
 Magnetism hasn't been implemented yet.  We may want a separate Imagnetic
 …
 Need to write code to generate the polydispersity loops in python for
+kernels that are only implemented in python.
+kernels that are only implemented in python.  Also, need to implement
+an example kernel directly in python.

sasmodels/models/cylinder.c

-                      rff7119b
+                      r5d4777d
 real form_volume(real radius, real length);
 real Iq(real q, real sld, real solvent_sld, real radius, real length);
+real Iqxy(real qx, real qy, real sld, real solvent_sld, real radius, real length, real theta, real phi);
+real Iqxy(real qx, real qy, real sld, real solvent_sld,
+    real radius, real length, real theta, real phi);
+// twovd = 2 * volume * delta_rho
+// besarg = q * R * sin(alpha)
+// siarg = q * L/2 * cos(alpha)
+real _cyl(real twovd, real besarg, real siarg);
+real _cyl(real twovd, real besarg, real siarg)
+{
+    const real bj = (besarg == REAL(0.0) ? REAL(0.5) : J1(besarg)/besarg);
+    const real si = (siarg == REAL(0.0) ? REAL(1.0) : sin(siarg)/siarg);
+    return twovd*si*bj;
+}
 real form_volume(real radius, real length)
 …
     real length)
+{
+    const real halflength = REAL(0.5)*length;
+    real summ = REAL(0.0);
+    const real qr = q*radius;
+    const real qh = q*REAL(0.5)*length;
+    const real twovd = REAL(2.0)*(sld-solvent_sld)*form_volume(radius, length);
+    real total = REAL(0.0);
     // real lower=0, upper=M_PI_2;
     for (int i=0; i<76 ;i++) {
         // translate a point in [-1,1] to a point in [lower,upper]
+        //const real zi = ( Gauss76Z[i]*(upper-lower) + upper + lower )/2.0;
+        const real zi = REAL(0.5)*(Gauss76Z[i]*M_PI_2 + M_PI_2);
+        summ += Gauss76Wt[i] * CylKernel(q, radius, halflength, zi);
+        //const real alpha = ( Gauss76Z[i]*(upper-lower) + upper + lower )/2.0;
+        const real alpha = REAL(0.5)*(Gauss76Z[i]*M_PI_2 + M_PI_2);
+        real sn, cn;
+        SINCOS(alpha, sn, cn);
+        const real fq = _cyl(twovd, qr*sn, qh*cn);
+        total += Gauss76Wt[i] * fq * fq * sn;
+    }
     // translate dx in [-1,1] to dx in [lower,upper]
+    //const real form = (upper-lower)/2.0*summ;
+    const real form = summ * M_PI_4;
+    // Multiply by contrast^2, normalize by cylinder volume and convert to cm-1
+    // NOTE that for this (Fournet) definition of the integral, one must MULTIPLY by Vcyl
+    // The additional volume factor is for polydisperse volume normalization.
+    const real s = (sld - solvent_sld) * form_volume(radius, length);
+    return REAL(1.0e-4) * form * s * s;
+    //const real form = (upper-lower)/2.0*total;
+    return REAL(1.0e-4) * total * M_PI_4;
+}
 …
     real phi)
+{
+    // TODO: check that radius<0 and length<0 give zero scattering.
+    // This should be the case since the polydispersity weight vector should
+    // be zero length, and this function never called.
     real sn, cn; // slots to hold sincos function output
 …
     const real alpha = acos(cos_val);
+    // The following is CylKernel() / sin(alpha), but we are doing it in place
+    // to avoid sin(alpha)/sin(alpha) for alpha = 0.  It is also a teensy bit
+    // faster since we don't multiply and divide sin(alpha).
+    const real twovd = REAL(2.0)*(sld-solvent_sld)*form_volume(radius, length);
     SINCOS(alpha, sn, cn);
+    const real besarg = q*radius*sn;
+    const real siarg = REAL(0.5)*q*length*cn;
+    // lim_{x->0} J1(x)/x = 1/2,   lim_{x->0} sin(x)/x = 1
+    const real bj = (besarg == REAL(0.0) ? REAL(0.5) : J1(besarg)/besarg);
+    const real si = (siarg == REAL(0.0) ? REAL(1.0) : sin(siarg)/siarg);
+    const real form = REAL(4.0)*bj*bj*si*si;
+    // Multiply by contrast^2, normalize by cylinder volume and convert to cm-1
+    // NOTE that for this (Fournet) definition of the integral, one must MULTIPLY by Vcyl
+    // The additional volume factor is for polydisperse volume normalization.
+    const real s = (sld - solvent_sld) * form_volume(radius, length);
+    return REAL(1.0e-4) * form * s * s; // * correction;
+    const real fq = _cyl(twovd, q*radius*sn, q*REAL(0.5)*length*cn);
+    return REAL(1.0e-4) * fq * fq; // * correction;
+}

sasmodels/models/cylinder.py

-                      ra7684e5
+                      r5d4777d
+# cylinder model
 # Note: model title and parameter table are inserted automatically
 r"""
 …
 To provide easy access to the orientation of the cylinder, we define the
 axis of the cylinder using two angles $\theta$ and $\phi$. Those angles
 are defined in Figure :num:`figure #CylinderModel-orientation`.
+are defined in Figure :num:`figure #cylinder-orientation`.
 .. _CylinderModel-orientation:
+.. _cylinder-orientation:
 .. figure:: img/image061.JPG   (should be img/cylinder-1.jpg, or img/cylinder-orientation.jpg)
 …
 Validation of our code was done by comparing the output of the 1D model
 to the output of the software provided by the NIST (Kline, 2006).
 Figure :num:`figure #CylinderModel-compare` shows a comparison of
+Figure :num:`figure #cylinder-compare` shows a comparison of
 the 1D output of our model and the output of the NIST software.
 .. _CylinderModel-compare:
+.. _cylinder-compare:
 .. figure:: img/image065.JPG
 …
 the intensity for fully oriented cylinders, we can compare the result of
 averaging our 2D output using a uniform distribution $p(\theta, \phi) = 1.0$.
 Figure :num:`figure #CylinderModel-crosscheck` shows the result of
+Figure :num:`figure #cylinder-crosscheck` shows the result of
 such a cross-check.
 .. _CylinderModel-crosscheck:
+.. _cylinder-crosscheck:
 .. figure:: img/image066.JPG
 …
 title = "Right circular cylinder with uniform scattering length density."
 description = """
      f(q)= 2*(sldCyl - sldSolv)*V*sin(qLcos(alpha/2))
+     P(q)= 2*(sld - solvent_sld)*V*sin(qLcos(alpha/2))
             /[qLcos(alpha/2)]*J1(qRsin(alpha/2))/[qRsin(alpha)]
 …
             L: Length of the cylinder
             J1: The bessel function
             alpha: angle betweenthe axis of the
+            alpha: angle between the axis of the
             cylinder and the q-vector for 1D
             :the ouput is P(q)=scale/V*integral
             from pi/2 to zero of...
             f(q)^(2)*sin(alpha)*dalpha+ bkg
     """
+            f(q)^(2)*sin(alpha)*dalpha + background
+"""
 parameters = [
 …
+    ]
 source = [ "lib/J1.c", "lib/gauss76.c", "lib/cylkernel.c", "cylinder.c"]
+source = [ "lib/J1.c", "lib/gauss76.c", "cylinder.c" ]
 def ER(radius, length):

sasmodels/models/cylinder_clone.c

-                      rff7119b
+                      r5d4777d
 real Iq(real q, real sld, real solvent_sld, real radius, real length);
 real Iqxy(real qx, real qy, real sld, real solvent_sld, real radius, real length, real theta, real phi);
+// twovd = 2 * volume * delta_rho
+// besarg = q * R * sin(alpha)
+// siarg = q * L/2 * cos(alpha)
+real _cyl(real twovd, real besarg, real siarg, real alpha);
+real _cyl(real twovd, real besarg, real siarg, real alpha)
+{
+    const real bj = (besarg == REAL(0.0) ? REAL(0.5) : J1(besarg)/besarg);
+    const real si = (siarg == REAL(0.0) ? REAL(1.0) : sin(siarg)/siarg);
+    return twovd*si*bj;
+}
 real form_volume(real radius, real length)
 …
     return M_PI*radius*radius*length;
+}
 real Iq(real q,
     real sldCyl,
 …
     real length)
+{
+    const real h = REAL(0.5)*length;
+    real summ = REAL(0.0);
+    const real qr = q*radius;
+    const real qh = q*REAL(0.5)*length;
+    const real twovd = REAL(2.0)*(sldCyl-sldSolv)*form_volume(radius, length);
+    real total = REAL(0.0);
+    // real lower=0, upper=M_PI_2;
     for (int i=0; i<76 ;i++) {
+        //const real zi = ( Gauss76Z[i]*(uplim-lolim) + uplim + lolim )/2.0;
+        const real zi = REAL(0.5)*(Gauss76Z[i]*M_PI_2 + M_PI_2);
+        summ += Gauss76Wt[i] * CylKernel(q, radius, h, zi);
+        // translate a point in [-1,1] to a point in [lower,upper]
+        //const real alpha = ( Gauss76Z[i]*(upper-lower) + upper + lower )/2.0;
+        const real alpha = REAL(0.5)*(Gauss76Z[i]*M_PI_2 + M_PI_2);
+        real sn, cn;
+        SINCOS(alpha, sn, cn);
+        const real fq = _cyl(twovd, qr*sn, qh*cn, alpha);
+        total += Gauss76Wt[i] * fq * fq * sn;
+    }
+    //const real form = (uplim-lolim)/2.0*summ;
+    const real form = summ * M_PI_4;
+    // Multiply by contrast^2, normalize by cylinder volume and convert to cm-1
+    // NOTE that for this (Fournet) definition of the integral, one must MULTIPLY by Vcyl
+    // The additional volume factor is for polydisperse volume normalization.
+    const real s = (sldCyl - sldSolv) * form_volume(radius, length);
+    return REAL(1.0e8) * form * s * s;
+    // translate dx in [-1,1] to dx in [lower,upper]
+    //const real form = (upper-lower)/2.0*total;
+    return REAL(1.0e8) * total * M_PI_4;
+}
 …
     const real alpha = acos(cos_val);
     // The following is CylKernel() / sin(alpha), but we are doing it in place
     // to avoid sin(alpha)/sin(alpha) for alpha = 0.  It is also a teensy bit
     // faster since we don't multiply and divide sin(alpha).
+    const real qr = q*radius;
+    const real qh = q*REAL(0.5)*length;
+    const real twovd = REAL(2.0)*(sldCyl-sldSolv)*form_volume(radius, length);
     SINCOS(alpha, sn, cn);
+    const real besarg = q*radius*sn;
+    const real siarg = REAL(0.5)*q*length*cn;
+    // lim_{x->0} J1(x)/x = 1/2,   lim_{x->0} sin(x)/x = 1
+    const real bj = (besarg == REAL(0.0) ? REAL(0.5) : J1(besarg)/besarg);
+    const real si = (siarg == REAL(0.0) ? REAL(1.0) : sin(siarg)/siarg);
+    const real form = REAL(4.0)*bj*bj*si*si;
+    // Multiply by contrast^2, normalize by cylinder volume and convert to cm-1
+    // NOTE that for this (Fournet) definition of the integral, one must MULTIPLY by Vcyl
+    // The additional volume factor is for polydisperse volume normalization.
+    const real s = (sldCyl - sldSolv) * form_volume(radius, length);
+    return REAL(1.0e8) * form * s * s * spherical_integration;
+    const real fq = _cyl(twovd, qr*sn, qh*cn, alpha);
+    return REAL(1.0e8) * fq * fq * spherical_integration;
+}

sasmodels/models/cylinder_clone.py

ra7684e5	r5d4777d
150	150	"Out of plane angle" ],
151	151	]
152		source = [ "lib/J1.c", "lib/gauss76.c", "~~lib/cylkernel.c", "cylinder_clone.c"~~]
	152	source = [ "lib/J1.c", "lib/gauss76.c", "cylinder_clone.c" ]
153	153
154	154	def ER(radius, length):

sasmodels/models/cylinder_onefile.py

-                      ra7684e5
+                      r5d4777d
 source = [ "lib/J1.c", "lib/gauss76.c", "lib/cylkernel.c" ]
 c_form_volume = """
+form_volume = """
     return M_PI*radius*radius*length;
 """
 c_Iq = """
+    """
+Iq = """
     const real h = REAL(0.5)*length;
     real summ = REAL(0.0);
 …
     const real s = (sld - solvent_sld) * form_volume(radius, length);
     return REAL(1.0e-4) * form * s * s;
 """
 c_Iqxy = """
+    """
+Iqxy = """
     real sn, cn; // slots to hold sincos function output
 …
     const real s = (sld - solvent_sld) * form_volume(radius, length);
     return REAL(1.0e-4) * form * s * s; // * correction;
 """
+    """
 def ER(radius, length):

sasmodels/models/ellipsoid.c

-                      rce27e21
+                      r5d4777d
+/* PARAMETERS
+real form_volume(real rpolar, real requatorial);
+real Iq(real q, real sld, real solvent_sld, real rpolar, real requatorial);
+real Iqxy(real qx, real qy, real sld, real solvent_sld,
+    real rpolar, real requatorial, real theta, real phi);
+real _ellipsoid_kernel(real q, real rpolar, real requatorial, real cos_alpha);
+real _ellipsoid_kernel(real q, real rpolar, real requatorial, real cos_alpha)
+{
+name: "ellipsoid",
+title: "Ellipsoid with uniform scattering length density",
+include: [ "lib/gauss76.c" ],
+parameters: [
+   // [ "name", "units", default, [lower, upper], "type", "description" ],
+   [ "sld", "1e-6/Ang^2", 4, [-Infinity,Infinity], "",
+     "Ellipsoid scattering length density" ],
+   [ "solvent_sld", "1e-6/Ang^2", 1, [-Infinity,Infinity], "",
+     "Solvent scattering length density" ],
+   [ "a", "Ang",  20, [0, Infinity], "volume",
+     "Ellipsoid polar radius" ],
+   [ "b", "Ang",  20, [0, Infinity], "volume",
+     "Ellipsoid equatorial radius" ],
+   [ "theta", "degrees", 60, [-Infinity, Infinity], "orientation",
+     "In plane angle" ],
+   [ "phi", "degrees", 60, [-Infinity, Infinity], "orientation",
+     "Out of plane angle" ],
+],
+}
+PARAMETERS END
+DOCUMENTATION
+.. _EllipseModel:
+DOCUMENTATION END
+*/
+real form_volume(real a, real b);
+real Iq(real qx, real qy, real sld, real solvent_sld, real a, real b);
+real Iqxy(real qx, real qy, real sld, real solvent_sld, real a, real b, real theta, real phi);
+real form_volume(real a, real b)
+{
+    return REAL(1.333333333333333)*M_PI_2*a*b*b;
+    real sn, cn;
+    real ratio = rpolar/requatorial;
+    const real u = q*requatorial*sqrt(REAL(1.0)
+                   + cos_alpha*cos_alpha*(ratio*ratio - REAL(1.0)));
+    SINCOS(u, sn, cn);
+    const real f = ( u==REAL(0.0) ? REAL(1.0) : REAL(3.0)*(sn-u*cn)/(u*u*u) );
+    return f*f;
+}
 real ellipsoid_kernel(double q, double b, double a, double dum)
+real form_volume(real rpolar, real requatorial)
+{
+    real sn, cn;
+    const real nu = a/b;
+    const real arg = q * b * sqrt(REAL(1.0)+(dum*dum*(nu*nu--REAL(1.0))));
+    SINCOS(arg, sn, cn);
+    const real f = (arg==REAL(0.0) ? REAL(1.0) : REAL(3.0)*(sn-arg*cn)/(arg*arg*arg);
+    return f*f;
+    return REAL(1.333333333333333)*M_PI*rpolar*requatorial*requatorial;
+}
 …
     real sld,
     real solvent_sld,
     real a,
     real b)
+    real rpolar,
+    real requatorial)
+{
+    real summ = REAL(0.0);
+    //const real lower = REAL(0.0);
+    //const real upper = REAL(1.0);
+    real total = REAL(0.0);
     for (int i=0;i<76;i++) {
         //const real zi = ( Gauss76Z[i]*(uplim-lolim) + uplim + lolim )/2.0;
         zi = ( Gauss76Z[i] + REAL(1.0))/REAL(2.0);
         summ += Gauss76Wt[i] * ellipsoid_kernel(q, b, a, zi);
+        //const real cos_alpha = (Gauss76Z[i]*(upper-lower) + upper + lower)/2;
+        const real cos_alpha = REAL(0.5)*(Gauss76Z[i] + REAL(1.0));
+        total += Gauss76Wt[i] * _ellipsoid_kernel(q, rpolar, requatorial, cos_alpha);
+    }
     //const real form = (uplim-lolim)/2.0*summ;
     const real form = REAL(0.5)*summ
     const real s = (sld - sld_solvent) * form_volume(a, b);
+    //const real form = (upper-lower)/2*total;
+    const real form = REAL(0.5)*total;
+    const real s = (sld - solvent_sld) * form_volume(rpolar, requatorial);
     return REAL(1.0e-4) * form * s * s;
+}
 …
     real sld,
     real solvent_sld,
     real a,
     real b,
+    real rpolar,
+    real requatorial,
     real theta,
     real phi)
 …
     const real q = sqrt(qx*qx + qy*qy);
     SINCOS(theta*M_PI_180, sn, cn);
     const real cos_val = cn*cos(phi*M_PI_180)*(qx/q) + sn*(qy/q);
     const real form = ellipsoid_kernel(q, b, a, cos_val);
     const real s = (sld - solvent_sld) * form_volume(a, b);
+    const real cos_alpha = cn*cos(phi*M_PI_180)*(qx/q) + sn*(qy/q);
+    const real form = _ellipsoid_kernel(q, rpolar, requatorial, cos_alpha);
+    const real s = (sld - solvent_sld) * form_volume(rpolar, requatorial);
     return REAL(1.0e-4) * form * s * s;

sasmodels/sasview_model.py

-                      rff7119b
+                      r5d4777d
 try:
     import pyopencl
+    from .gen import opencl_model as load_model
+except ImportError:
+    from .gpu import load_model
+except ImportError,exc:
+    warnings.warn(str(exc))
     warnings.warn("OpenCL not available --- using ctypes instead")
     from .gen import dll_model as load_model
+    from .dll import load_model
 …
             # Check whether we have a list of ndarrays [qx,qy]
             qx, qy = qdist
+            return self.calculate_Iq(qx, qy)
+            partype = self._model.info['partype']
+            if not partype['orientation'] and not partype['magnetic']:
+                return self.calculate_Iq(np.sqrt(qx**2+qy**2))
+            else:
+                return self.calculate_Iq(qx, qy)
         elif isinstance(qdist, np.ndarray):

sasmodels/weights.py

-                      rff7119b
+                      r5d4777d
         """
         sigma = self.width * center if relative else self.width
+        if sigma == 0:
+            return np.array([center], 'd'), np.array([1.], 'd')
+        if sigma == 0 or self.npts < 2:
+            if lb <= center <= ub:
+                return np.array([center], 'd'), np.array([1.], 'd')
+            else:
+                return np.array([], 'd'), np.array([], 'd')
         return self._weights(center, sigma, lb, ub)

SasView

Changeset 5d4777d in sasmodels

Legend:

compare-new.py

sasmodels/bumps_model.py

sasmodels/dll.py

sasmodels/gen.py

sasmodels/gpu.py

sasmodels/models/README.rst

sasmodels/models/cylinder.c

sasmodels/models/cylinder.py

sasmodels/models/cylinder_clone.c

sasmodels/models/cylinder_clone.py

sasmodels/models/cylinder_onefile.py

sasmodels/models/ellipsoid.c

sasmodels/sasview_model.py

sasmodels/weights.py

Download in other formats: