← Previous Changeset
Next Changeset →

Changeset 8a20be5 in sasmodels

Timestamp:

Jul 10, 2014 3:05:08 PM (11 years ago)

Author:

HMP1 <helen.park@…>

Branches:

master, core_shell_microgels, costrafo411, magnetic_model, release_v0.94, release_v0.95, ticket-1257-vesicle-product, ticket_1156, ticket_1265_superball, ticket_822_more_unit_tests

Children:

Parents:

Message:

Added a fit2 (fits two different models at different angles)
(preliminary) Added CoreshellCyl and CapCyl Kernels
(preliminary) Updated kernels to include functions

Files:

6 added
8 edited

JUN03305.DAT (added)
Kernel-CapCyl.cpp (added)
Kernel-CoreShellCylinder.cpp (modified) (2 diffs)
Kernel-Cylinder.cpp (modified) (3 diffs)
Kernel-Lamellar.cpp (modified) (1 diff)
NR_BessJ1.cpp (added)
capcylcope.py (added)
compare.py (added)
coreshellcylcode.py (modified) (3 diffs)
cylcode.py (modified) (4 diffs)
fit.py (modified) (1 diff)
fit2.py (added)
lamellarcode.py (modified) (4 diffs)
sasmodel.py (modified) (5 diffs)

Legend:

Unmodified
Added
Removed

Kernel-CoreShellCylinder.cpp

-                      r5378e40
+                      r8a20be5
         if (besarg1 == 0.0){be1 = 0.5;}
         else{
+            if((ax=fabs(besarg1)) < 8.0)
+            {
+                y=besarg1*besarg1;
+                ans1=besarg1*(72362614232.0+y*(-7895059235.0+y*(242396853.1+y*(-2972611.439+y*(15704.48260+y*(-30.16036606))))));
+                ans2=144725228442.0+y*(2300535178.0+y*(18583304.74+y*(99447.43394+y*(376.9991397+y*1.0))));
+                ans=ans1/ans2;
+            }
+            else
+            {
+                z=8.0/ax;
+                y=z*z;
+                xx=ax-2.356194491;
+                ans1=1.0+y*(0.183105e-2+y*(-0.3516396496e-4+y*(0.2457520174e-5+y*(-0.240337019e-6))));
+                ans2=0.04687499995+y*(-0.2002690873e-3+y*(0.8449199096e-5+y*(-0.88228987e-6+y*0.105787412e-6)));
+                ans=sqrt(0.636619772/ax)*(cos(xx)*ans1-z*sin(xx)*ans2);
+                if (besarg1 < 0.0) {ans *= -1;}
+            }
+            be1 = ans/besarg1;
+            bel = NR_BessJ1(besarg1)/besarg1
+        }
         if (besarg2 == 0.0){be2 = 0.5;}
 …

Kernel-Cylinder.cpp

-                      r5378e40
+                      r8a20be5
 __kernel void CylinderKernel(__global const float *qx, global const float *qy, __global float *_ptvalue, const float sub,
 const float rr, const float h, const float scale, const float radius_weight, const float length_weight,
 const float theta_weight, const float phi_weight, const float cyl_theta,
 const float cyl_phi, const int count, const int size)
+__kernel void CylinderKernel(__global const real *qx, global const real *qy, __global real *_ptvalue, const real sub,
+const real rr, const real h, const real scale, const real radius_weight, const real length_weight,
+const real theta_weight, const real phi_weight, const real cyl_theta,
+const real cyl_phi, const int count, const int size)
+{
         // qq is the q-value for the calculation (1/A)
 …
     if(i < count)
+    {
         float qq = sqrt(qx[i]*qx[i]+qy[i]*qy[i]);
+        real qq = sqrt(qx[i]*qx[i]+qy[i]*qy[i]);
         float pi = 4.0*atan(1.0);
         float theta = cyl_theta*pi/180.0;
         float phi = cyl_phi*pi/180.0;
+        real pi = 4.0*atan(1.0);
+        real theta = cyl_theta*pi/180.0;
+        real phi = cyl_phi*pi/180.0;
         float cyl_x = cos(theta)*cos(phi);
         float cyl_y = sin(theta);
         float cos_val = cyl_x*(qx[i]/qq) + cyl_y*(qy[i]/qq);
+        real cyl_x = cos(theta)*cos(phi);
+        real cyl_y = sin(theta);
+        real cos_val = cyl_x*(qx[i]/qq) + cyl_y*(qy[i]/qq);
         float alpha = acos(cos_val);
+        real alpha = acos(cos_val);
         if(alpha == 0.0){
             alpha = 1.0e-26;
+        }
+        float besarg = qq*rr*sin(alpha);
+        float siarg = qq*h/2*cos(alpha);
+        real besarg = qq*rr*sin(alpha);
+        real siarg = qq*h/2*cos(alpha);
+        real be=0.0; real si=0.0;
+            float xx=0.0; float y=0.0; float bj=0.0; float ans1=0.0; float ans2=0.0; float z=0.0; float answer=0.0;
+            float contrast=0.0; float form=0.0; float be=0.0; float si=0.0;
+        real bj = NR_BessJ1(besarg);
         float ax = fabs(besarg);
+        real d1 = qq*rr*sin(alpha);
+        if(ax < 8.0) {
+            y=besarg*besarg;
+            ans1=besarg*(72362614232.0+y*(-7895059235.0+y*(242396853.1+y*(-2972611.439+y*(15704.48260+y*(-30.16036606))))));
+            ans2=144725228442.0+y*(2300535178.0+y*(18583304.74+y*(99447.43394+y*(376.9991397+y*1.0))));
+            bj=ans1/ans2;
+        if (besarg == 0.0){
+            be = sin(alpha);
+        }
         else{
+            z=8.0/ax;
+            y=z*z;
+            xx=ax - 2.356194491;
+            ans1=1.0+y*(0.183105e-2+y*(-0.3516396496e-4+y*(0.2457520174e-5+y*(-0.240337019e-6))));
+            ans2=0.04687499995+y*(-0.2002690873e-3+y*(0.8449199096e-5+y*(-0.88228987e-6+y*0.105787412e-6)));
+            bj=sqrt(0.636619772/ax)*(cos(xx)*ans1-z*sin(xx)*ans2);
+            if(besarg < 0.0){bj*=-1;}
+            be = bj*bj*4.0*sin(alpha)/(d1*d1);
+        }
+        if(siarg == 0.0){
+            si = 1.0;
+        }
+        else{
+            si = sin(siarg)*sin(siarg)/(siarg*siarg);
+        }
+        float d1 = qq*rr*sin(alpha);
+        if (besarg == 0.0) {be = sin(alpha);}
+        else {be = bj*bj*4.0*sin(alpha)/(d1*d1);}
+        if(siarg == 0.0) {si = 1.0;}
+        else{si = sin(siarg)*sin(siarg)/(siarg*siarg);}
+        form = be*si/sin(alpha);
+        answer = sub*sub*form*acos(-1.0)*rr*rr*h*1.0e8*scale;
+        real form = be*si/sin(alpha);
+        real answer = sub*sub*form*acos(-1.0)*rr*rr*h*1.0e8*scale;
         _ptvalue[i] = radius_weight*length_weight*theta_weight*phi_weight*answer*pow(rr,2)*h;
 …
             _ptvalue[i] *= fabs(cos(cyl_theta*pi/180.0));
+        }
+}
+    }
+}

Kernel-Lamellar.cpp

-                      r5378e40
+                      r8a20be5
+__kernel void LamellarKernel(__global const float *qx, global const float *qy, __global float *ret, const float bi_thick,
+ const float scale, const float sub, const float background, const int length)
+#ifndef real
+# define real float
+#endif
+__kernel void LamellarKernel(__global const real *qx, global const real *qy, __global real *ret, const real bi_thick,
+ const real scale, const real sub, const real background, const int length)
+{
     int i = get_global_id(0);
     if(i < length)
+    {
         float q = sqrt(qx[i]*qx[i]+qy[i]*qy[i]);
         float pi = 4.0*atan(1.0);
         float Pq = 2.0*sub*(sub/q)/q*(1.0-cos(q*bi_thick));
+        real q = sqrt(qx[i]*qx[i]+qy[i]*qy[i]);
+        real pi = 4.0*atan(1.0);
+        real Pq = 2.0*sub*(sub/q)/q*(1.0-cos(q*bi_thick));
         ret[i] = 2.0*pi*scale*Pq/(q*q)/bi_thick*1.0e8;
         ret[i] += background;

coreshellcylcode.py

-                      r5378e40
+                      r8a20be5
 import pyopencl as cl
 from weights import GaussianDispersion
+from sasmodel import card
+def set_precision(src, qx, qy, dtype):
+    qx = np.ascontiguousarray(qx, dtype=dtype)
+    qy = np.ascontiguousarray(qy, dtype=dtype)
+    if np.dtype(dtype) == np.dtype('float32'):
+        header = """\
+#define real float
+"""
+    else:
+        header = """\
+#pragma OPENCL EXTENSION cl_khr_fp64: enable
+#define real double
+"""
+    return header+src, qx, qy
 class GpuCoreShellCylinder(object):
     PARS = {'scale':1, 'radius':1, 'thickness':1, 'length':1, 'core_sld':1e-6, 'shell_sld':1e-6, 'solvent_sld':0,
+    PARS = {'scale':1, 'radius':1, 'thickness':1, 'length':1, 'core_sld':1e-6, 'shell_sld':-1e-6, 'solvent_sld':0,
             'background':0, 'axis_theta':0, 'axis_phi':0}
     PD_PARS = ['radius', 'length', 'thickness', 'axis_phi', 'axis_theta']
+    def __init__(self, qx, qy):
+        self.qx = np.asarray(qx, np.float32)
+        self.qy = np.asarray(qy, np.float32)
+    def __init__(self, qx, qy, dtype='float32'):
         #create context, queue, and build program
+        self.ctx = cl.create_some_context()
+        self.queue = cl.CommandQueue(self.ctx)
+        self.prg = cl.Program(self.ctx, open('Kernel-CoreShellCylinder.cpp').read()).build()
+        ctx,_queue = card()
+        src, qx, qy = set_precision(open('NR_BessJ1.cpp').read()+"\n"+open('Kernel-CoreShellCylinder.cpp').read(), qx, qy, dtype=dtype)
+        self.prg = cl.Program(ctx, src).build()
+        self.qx, self.qy = qx, qy
         #buffers
         mf = cl.mem_flags
         self.qx_b = cl.Buffer(self.ctx, mf.READ_ONLY | mf.COPY_HOST_PTR, hostbuf=self.qx)
         self.qy_b = cl.Buffer(self.ctx, mf.READ_ONLY | mf.COPY_HOST_PTR, hostbuf=self.qy)
         self.res_b = cl.Buffer(self.ctx, mf.WRITE_ONLY, qx.nbytes)
         self.res = np.empty_like(self.qx)
+        self.qx_b = cl.Buffer(ctx, mf.READ_ONLY | mf.COPY_HOST_PTR, hostbuf=self.qx)
+        self.qy_b = cl.Buffer(ctx, mf.READ_ONLY | mf.COPY_HOST_PTR, hostbuf=self.qy)
+        self.res_b = cl.Buffer(ctx, mf.WRITE_ONLY, qx.nbytes)
+        self.res = np.empty_like(qx)
     def eval(self, pars):
+        _ctx,queue = card()
         radius, length, thickness, axis_phi, axis_theta = [GaussianDispersion(int(pars[base+'_pd_n']), pars[base+'_pd'], pars[base+'_pd_nsigma'])
                                      for base in GpuCoreShellCylinder.PD_PARS]
 …
                         for f in xrange(len(thickness.weight)):
                             self.prg.CoreShellCylinderKernel(self.queue, self.qx.shape, None, self.qx_b, self.qy_b, self.res_b,
+                            self.prg.CoreShellCylinderKernel(queue, self.qx.shape, None, self.qx_b, self.qy_b, self.res_b,
                                     np.float32(axis_theta.value[k]), np.float32(axis_phi.value[l]), np.float32(thickness.value[f]),
                                     np.float32(length.value[j]), np.float32(radius.value[i]), np.float32(pars['scale']),
 …
                                     np.float32(pars['shell_sld']), np.float32(pars['solvent_sld']),np.uint32(size),
                                     np.uint32(self.qx.size))
                             cl.enqueue_copy(self.queue, self.res, self.res_b)
+                            cl.enqueue_copy(queue, self.res, self.res_b)
                             sum += self.res

cylcode.py

-                      r5378e40
+                      r8a20be5
 import pyopencl as cl
 from weights import GaussianDispersion
+from sasmodel import card
+def set_precision(src, qx, qy, dtype):
+    qx = np.ascontiguousarray(qx, dtype=dtype)
+    qy = np.ascontiguousarray(qy, dtype=dtype)
+    if np.dtype(dtype) == np.dtype('float32'):
+        header = """\
+#define real float
+"""
+    else:
+        header = """\
+#pragma OPENCL EXTENSION cl_khr_fp64: enable
+#define real double
+"""
+    return header+src, qx, qy
 class GpuCylinder(object):
 …
     PD_PARS = ['radius', 'length', 'cyl_theta', 'cyl_phi']
     def __init__(self, qx, qy):
+    def __init__(self, qx, qy, dtype='float32'):
-        self.qx = np.asarray(qx, np.float32)
-        self.qy = np.asarray(qy, np.float32)
         #create context, queue, and build program
+        self.ctx = cl.create_some_context()
+        self.queue = cl.CommandQueue(self.ctx)
+        self.prg = cl.Program(self.ctx, open('Kernel-Cylinder.cpp').read()).build()
+        ctx,_queue = card()
+        src, qx, qy = set_precision(open('NR_BessJ1.cpp').read()+"\n"+open('Kernel-Cylinder.cpp').read(), qx, qy, dtype=dtype)
+        self.prg = cl.Program(ctx, src).build()
+        self.qx, self.qy = qx, qy
         #buffers
         mf = cl.mem_flags
         self.qx_b = cl.Buffer(self.ctx, mf.READ_ONLY | mf.COPY_HOST_PTR, hostbuf=self.qx)
         self.qy_b = cl.Buffer(self.ctx, mf.READ_ONLY | mf.COPY_HOST_PTR, hostbuf=self.qy)
         self.res_b = cl.Buffer(self.ctx, mf.WRITE_ONLY, qx.nbytes)
+        self.qx_b = cl.Buffer(ctx, mf.READ_ONLY | mf.COPY_HOST_PTR, hostbuf=self.qx)
+        self.qy_b = cl.Buffer(ctx, mf.READ_ONLY | mf.COPY_HOST_PTR, hostbuf=self.qy)
+        self.res_b = cl.Buffer(ctx, mf.WRITE_ONLY, qx.nbytes)
         self.res = np.empty_like(self.qx)
     def eval(self, pars):
+        radius,length,cyl_theta,cyl_phi = \
+        _ctx,queue = card()
+        radius, length, cyl_theta, cyl_phi = \
             [GaussianDispersion(int(pars[base+'_pd_n']), pars[base+'_pd'], pars[base+'_pd_nsigma'])
              for base in GpuCylinder.PD_PARS]
 …
         sub = pars['sldCyl'] - pars['sldSolv']
+        real = np.float32 if self.qx.dtype == np.dtype('float32') else np.float64
         #Loop over radius, length, theta, phi weight points
         for i in xrange(len(radius.weight)):
 …
                     for l in xrange(len(cyl_phi.weight)):
+                        self.prg.CylinderKernel(self.queue, self.qx.shape, None, self.qx_b, self.qy_b, self.res_b, np.float32(sub),
+                                           np.float32(radius.value[i]), np.float32(length.value[j]), np.float32(pars['scale']),
+                                           np.float32(radius.weight[i]), np.float32(length.weight[j]), np.float32(cyl_theta.weight[k]),
+                                           np.float32(cyl_phi.weight[l]), np.float32(cyl_theta.value[k]), np.float32(cyl_phi.value[l]),
+                        self.prg.CylinderKernel(queue, self.qx.shape, None, self.qx_b, self.qy_b, self.res_b, real(sub),
+                                           real(radius.value[i]), real(length.value[j]), real(pars['scale']),
+                                           real(radius.weight[i]), real(length.weight[j]), real(cyl_theta.weight[k]),
+                                           real(cyl_phi.weight[l]), real(cyl_theta.value[k]), real(cyl_phi.value[l]),
                                            np.uint32(self.qx.size), np.uint32(size))
                         cl.enqueue_copy(self.queue, self.res, self.res_b)
+                        cl.enqueue_copy(queue, self.res, self.res_b)
                         sum += self.res
                         vol += radius.weight[i]*length.weight[j]*pow(radius.value[i], 2)*length.value[j]

fit.py

-                      r5378e40
+                      r8a20be5
 set_beam_stop(data, 0.004)
+"""
 model = SasModel(data, GpuCylinder, scale=1, radius=64.1, length=266.96, sldCyl=.291e-6, sldSolv=5.77e-6, background=0,
                               cyl_theta=0, cyl_phi=0, radius_pd=0.1, radius_pd_n=10, radius_pd_nsigma=3,length_pd=0.1,
                               length_pd_n=5, length_pd_nsigma=3, cyl_theta_pd=0.1, cyl_theta_pd_n=5, cyl_theta_pd_nsigma=3,
+                              cyl_phi_pd=0.1, cyl_phi_pd_n=10, cyl_phi_pd_nsigma=3,)
+                              cyl_phi_pd=0.1, cyl_phi_pd_n=10, cyl_phi_pd_nsigma=3, dtype='float32')
+model.radius.range(0,100)
+model.length.range(0, 1000)
+model.cyl_theta.range(0,90)
+model.cyl_phi.range(0,90)
+"""
 model = SasModel(data, GpuEllipse, scale=.027, radius_a=60, radius_b=180, sldEll=.297e-6, sldSolv=5.773e-6, background=4.9,
                  axis_theta=0, axis_phi=90, radius_a_pd=0.1, radius_a_pd_n=10, radius_a_pd_nsigma=3, radius_b_pd=0.1, radius_b_pd_n=10,
                  radius_b_pd_nsigma=3, axis_theta_pd=0.1, axis_theta_pd_n=6, axis_theta_pd_nsigma=3, axis_phi_pd=0.1,
                  axis_phi_pd_n=6, axis_phi_pd_nsigma=3)
+                 axis_phi_pd_n=6, axis_phi_pd_nsigma=3, dtype='float')
 model = SasModel(data, GpuLamellar, scale=1, bi_thick=100, sld_bi=.291e-6, sld_sol=5.77e-6, background=0,
                  bi_thick_pd=0.1, bi_thick_pd_n=35, bi_thick_pd_nsigma=3)
+                 bi_thick_pd=0.1, bi_thick_pd_n=35, bi_thick_pd_nsigma=3, dtype='float')
+"""
 model = SasModel(data, GpuCoreShellCylinder, scale=1, radius=64.1, thickness=1, length=266.96, core_sld=.251e-6, shell_sld=6.2e-6,
                  solvent_sld=5.77e-6, background=0, axis_theta=0, axis_phi=0, radius_pd=0.1, radius_pd_n=10, radius_pd_nsigma=3,
+model = SasModel(data, GpuCoreShellCylinder, scale=1, radius=64.1, thickness=1, length=266.96, core_sld=1e-6, shell_sld=1e-6,
+                 solvent_sld=4e-6, background=0, axis_theta=0, axis_phi=0, radius_pd=0.1, radius_pd_n=10, radius_pd_nsigma=3,
                  length_pd=0.1, length_pd_n=10, length_pd_nsigma=3, thickness_pd=0.1, thickness_pd_n=2, thickness_pd_nsigma=3,
                  axis_theta_pd=0.1, axis_theta_pd_n=2, axis_theta_pd_nsigma=3, axis_phi_pd=0.1, axis_phi_pd_n=2,
+                 axis_phi_pd_nsigma=3)
+                 axis_phi_pd_nsigma=3, dtype='float')
+"""
 model.scale.range(0,10)

lamellarcode.py

-                      r5378e40
+                      r8a20be5
 import numpy as np
-import math
 import pyopencl as cl
 from weights import GaussianDispersion
+def set_precision(src, qx, qy, dtype):
+    qx = np.ascontiguousarray(qx, dtype=dtype)
+    qy = np.ascontiguousarray(qy, dtype=dtype)
+    if dtype == 'double':
+        header = """\
+#pragma OPENCL EXTENSION cl_khr_fp64: enable
+#define real double
+"""
+        return header+src,qx,qy
+    else:
+        return src,qx,qy
 …
         'scale':1, 'bi_thick':1, 'sld_bi':1e-6, 'sld_sol':0, 'background':0,
+    }
-    PD_PARS = ['bi_thick']
     def __init__(self, qx, qy):
+    def __init__(self, qx, qy, dtype='float'):
-        self.qx = np.asarray(qx, np.float32)
-        self.qy = np.asarray(qy, np.float32)
         #create context, queue, and build program
         self.ctx = cl.create_some_context()
         self.queue = cl.CommandQueue(self.ctx)
+        self.prg = cl.Program(self.ctx, open('Kernel-Lamellar.cpp').read()).build()
+        src,qx,qy = set_precision(open('Kernel-Lamellar.cpp').read(), qx, qy, dtype=dtype)
+        self.prg = cl.Program(self.ctx, src).build()
+        self.qx, self.qy = qx, qy
         #buffers
 …
         sub = pars['sld_bi'] - pars['sld_sol']
+        real = np.float32 if self.qx.dtype == np.dtype('float32') else np.float64
         for i in xrange(len(bi_thick.weight)):
             self.prg.LamellarKernel(self.queue, self.qx.shape, None, self.qx_b, self.qy_b, self.res_b, np.float32(bi_thick.value[i]),
                                     np.float32(pars['scale']), np.float32(sub), np.float32(pars['background']), np.uint32(self.qx.size))
+            self.prg.LamellarKernel(self.queue, self.qx.shape, None, self.qx_b, self.qy_b, self.res_b, real(bi_thick.value[i]),
+                                    real(pars['scale']), real(sub), real(pars['background']), np.uint32(self.qx.size))
             cl.enqueue_copy(self.queue, self.res, self.res_b)
 …
         return sum/norm + pars['background']
-    def lamellar_fit(self, pars, b_n=10, b_w=.1, sigma=3):
-        bi_thick = GaussianDispersion(b_n, b_w, sigma)
-        bi_thick.value, bi_thick.weight = bi_thick.get_weights(pars.bi_thick, 0, 1000, True)
-        sum, norm = 0.0, 0.0
-        for i in xrange(len(bi_thick.weight)):
-            self.prg.LamellarKernel(self.queue, self.qx.shape, None, self.qx_b, self.qy_b, self.res_b, np.float32(bi_thick.value[i]),
-                                    np.float32(pars.scale), np.float32(pars.sld_bi), np.float32(pars.sld_sol),
-                                    np.float32(pars.background), np.uint32(self.qx.size))
-            cl.enqueue_copy(self.queue, self.res, self.res_b)
-            sum += bi_thick.weight[i]*self.res
-            norm += bi_thick.weight[i]
-        return sum/norm + pars.background
 def demo():

sasmodel.py

-                      r5378e40
+                      r8a20be5
 import numpy as np
+import pyopencl as cl
 from bumps.names import Parameter
 from sans.dataloader.loader import Loader
 …
     loader = Loader()
     data = loader.load(filename)
+    if data is None:
+        raise IOError("Data %r could not be loaded"%filename)
     return data
 …
+GPU_CONTEXT = None
+GPU_QUEUE = None
+def card():
+    global GPU_CONTEXT, GPU_QUEUE
+    if GPU_CONTEXT is None:
+        GPU_CONTEXT = cl.create_some_context()
+        GPU_QUEUE = cl.CommandQueue(GPU_CONTEXT)
+    return GPU_CONTEXT, GPU_QUEUE
 class SasModel(object):
     def __init__(self, data, model, **kw):
+    def __init__(self, data, model, dtype='float32', **kw):
         self.index = data.mask==0
         self.iq = data.data[self.index]
 …
         self.qx = data.qx_data
         self.qy = data.qy_data
         self.gpu = model(self.qx, self.qy)
+        self.gpu = model(self.qx, self.qy, dtype=dtype)
         pd_pars = set(base+attr for base in model.PD_PARS for attr in ('_pd','_pd_n','_pd_nsigma'))
         total_pars = set(model.PARS.keys()) | pd_pars
 …
     def theory(self):
         pars = dict((k,v.value) for k,v in self._parameters.items())
+        print pars
         result = self.gpu.eval(pars)
         return result

Note: See TracChangeset for help on using the changeset viewer.

Download in other formats: