source: sasmodels/sasmodels/compare_many.py @ 17bbadd

Branches: core_shell_microgels, costrafo411, magnetic_model, release_v0.94, release_v0.95, ticket-1257-vesicle-product, ticket_1156, ticket_1265_superball, ticket_822_more_unit_tests
Last change on this file since 17bbadd was 17bbadd, checked in by Paul Kienzle <pkienzle@…>, 8 years ago

refactor so all model definition queries use model_info; better documentation of model_info structure; initial implementation of product model (broken)

  • Property mode set to 100755
File size: 8.8 KB
Line 
1#!/usr/bin/env python
2"""
3Program to compare results from many random parameter sets for a given model.
4
5The result is a comma separated value (CSV) table that can be redirected
6from standard output into a file and loaded into a spreadsheet.
7
8The models are compared for each parameter set and if the difference is
9greater than expected for that precision, the parameter set is labeled
10as bad and written to the output, along with the random seed used to
11generate that parameter value.  This seed can be used with :mod:`compare`
12to reload and display the details of the model.
13"""
14from __future__ import print_function
15
16import sys
17import traceback
18
19import numpy as np
20
21from . import core
22from . import generate
23from .compare import (MODELS, randomize_pars, suppress_pd, make_data,
24                      make_engine, get_demo_pars, columnize,
25                      constrain_pars, constrain_new_to_old)
26
def calc_stats(target, value, index):
    """
    Calculate statistics between the target value and the computed value.

    *target* and *value* are the vectors being compared, with the
    difference normalized by *target* to get relative error.  Only
    the elements listed in *index* are used, though index may be
    an empty slice defined by *slice(None, None)*.

    Returns:

        *maxrel* the maximum relative difference

        *rel95* the relative difference with the 5% biggest differences ignored

        *maxabs* the maximum absolute difference for the 5% biggest differences

        *maxval* the maximum value for the 5% biggest differences
    """
    abs_err = abs(value - target)[index]
    rel_err = abs_err / target[index]
    # Rank points by relative error so the worst 5% can be inspected
    # separately from the bulk of the comparison.
    order = np.argsort(rel_err)
    #cut90 = int(len(rel_err)*0.90)
    cut95 = int(len(rel_err) * 0.95)
    worst = order[cut95:]
    maxrel = np.max(rel_err)
    rel95 = rel_err[order[cut95]]
    maxabs = np.max(abs_err[worst])
    maxval = np.max(value[worst])
    return maxrel, rel95, maxabs, maxval
56
def print_column_headers(pars, parts):
    """
    Generate column headers for the differences and for the parameters,
    and print them to standard output.
    """
    stats = 'Max rel err|95% rel err|Max abs err above 90% rel|Max value above 90% rel'.split('|')
    # First row labels each group of stat columns; second row labels
    # every individual column.
    groups = ['']
    for part in parts:
        groups += [part] + [''] * (len(stats) - 1)
    groups.append("Parameters")
    columns = ['Seed'] + stats * len(parts) + sorted(pars.keys())
    for row in (groups, columns):
        print(','.join('"%s"' % label for label in row))
71
# Target 'good' value for various precision levels.
# Keys are engine names as given by the *base*/*comp* arguments to
# compare_instance; a parameter set whose max relative error exceeds the
# larger of the two engines' targets is flagged as bad.
# NOTE(review): the '!' suffix presumably selects a variant of the same
# precision engine (tolerances match the plain names) — confirm in
# compare.make_engine.
PRECISION = {
    'fast': 1e-3,
    'half': 1e-3,
    'single': 5e-5,
    'double': 5e-14,
    'single!': 5e-5,
    'double!': 5e-14,
    'quad!': 5e-18,
    'sasview': 5e-14,
}
def compare_instance(name, data, index, N=1, mono=True, cutoff=1e-5,
                     base='sasview', comp='double'):
    r"""
    Compare the model under different calculation engines.

    *name* is the name of the model.

    *data* is the data object giving $q, \Delta q$ calculation points.

    *index* is the active set of points.

    *N* is the number of comparisons to make.

    *mono* is True if polydispersity should be suppressed for the
    randomized parameter sets.

    *cutoff* is the polydispersity weight cutoff to make the calculation
    a little bit faster.

    *base* and *comp* are the names of the calculation engines to compare.

    Prints a CSV report to standard output: a per-model header, column
    headers, one row for each parameter set that exceeds the expected
    precision (with the seed that generated it), and a closing summary
    line with the good/total count and the maximum difference seen.
    """

    is_2d = hasattr(data, 'qx_data')
    model_info = core.load_model_info(name)
    pars = get_demo_pars(model_info)
    header = ('\n"Model","%s","Count","%d","Dimension","%s"'
              % (name, N, "2D" if is_2d else "1D"))
    if not mono: header += ',"Cutoff",%g'%(cutoff,)
    print(header)

    # 2-D comparison only makes sense for models with orientation or
    # magnetic parameters; skip the rest.
    if is_2d:
        partype = model_info['partype']
        if not partype['orientation'] and not partype['magnetic']:
            print(',"1-D only"')
            return

    # Some not very clean macros for evaluating the models and checking the
    # results.  They freely use variables from the current scope, even some
    # which have not been defined yet, complete with abuse of mutable lists
    # to allow them to update values in the current scope since nonlocal
    # declarations are not available in python 2.7.
    def try_model(fn, pars):
        """
        Return the model evaluated at *pars*.  If there is an exception,
        print it and return NaN of the right shape.
        """
        try:
            result = fn(**pars)
        except KeyboardInterrupt:
            raise
        except:
            # Deliberate catch-all: report the failure (with the seed from
            # the enclosing loop) and continue with NaN so the sweep keeps
            # going.  NaN fails the (stats[0] < expected) test below, so a
            # crashing parameter set is recorded as bad rather than lost.
            traceback.print_exc()
            print("when comparing %s for %d"%(name, seed))
            if hasattr(data, 'qx_data'):
                result = np.NaN*data.data
            else:
                result = np.NaN*data.x
        return result
    def check_model(pars):
        """
        Run the two calculators against *pars*, returning statistics
        on the differences.  See :func:`calc_stats` for the list of stats.
        """
        base_value = try_model(calc_base, pars)
        comp_value = try_model(calc_comp, pars)
        stats = calc_stats(base_value, comp_value, index)
        # max_diff and good are single-element lists so this closure can
        # update values seen by the enclosing loop (poor man's nonlocal).
        max_diff[0] = max(max_diff[0], stats[0])
        good[0] = good[0] and (stats[0] < expected)
        return list(stats)


    calc_base = make_engine(model_info, data, base, cutoff)
    calc_comp = make_engine(model_info, data, comp, cutoff)
    # Tolerance is the looser of the two engines being compared.
    expected = max(PRECISION[base], PRECISION[comp])

    num_good = 0
    first = True
    max_diff = [0]
    for k in range(N):
        print("%s %d"%(name, k), file=sys.stderr)
        # Remember the seed so a bad parameter set can be reproduced with
        # the compare program.
        seed = np.random.randint(1e6)
        pars_i = randomize_pars(pars, seed)
        constrain_pars(model_info['id'], pars_i)
        constrain_new_to_old(model_info['id'], pars_i)
        if mono:
            pars_i = suppress_pd(pars_i)

        good = [True]
        columns = check_model(pars_i)
        columns += [v for _, v in sorted(pars_i.items())]
        # Column headers are deferred until the first randomized parameter
        # set exists, since the headers list its keys.
        if first:
            labels = [" vs. ".join((calc_base.engine, calc_comp.engine))]
            print_column_headers(pars_i, labels)
            first = False
        if good[0]:
            num_good += 1
        else:
            print(("%d,"%seed)+','.join("%s"%v for v in columns))
    print('"good","%d/%d","max diff",%g'%(num_good, N, max_diff[0]))
179
180
def print_usage():
    """
    Print the command usage string.
    """
    usage = "usage: compare_many.py MODEL COUNT (1dNQ|2dNQ) (CUTOFF|mono) (single|double|quad)"
    print(usage)
186
187
def print_models():
    """
    Print the list of available models in columns.
    """
    listing = columnize(MODELS, indent="  ")
    print(listing)
193
194
def print_help():
    """
    Print usage string, the option descriptions and the list of available models.
    """
    print_usage()
    print("""\

MODEL is the model name of the model or "all" for all the models
in alphabetical order.

COUNT is the number of randomly generated parameter sets to try. A value
of "10000" is a reasonable check for monodisperse models, or "100" for
polydisperse models.   For a quick check, use "100" and "5" respectively.

NQ is the number of Q values to calculate.  If it starts with "1d", then
it is a 1-dimensional problem, with log spaced Q points from 1e-3 to 1.0.
If it starts with "2d" then it is a 2-dimensional problem, with linearly
spaced points Q points from -1.0 to 1.0 in each dimension. The usual
values are "1d100" for 1-D and "2d32" for 2-D.

CUTOFF is the cutoff value to use for the polydisperse distribution. Weights
below the cutoff will be ignored.  Use "mono" for monodisperse models.  The
choice of polydisperse parameters, and the number of points in the distribution
is set in compare.py defaults for each model.

PRECISION is the floating point precision to use for comparisons.  If two
precisions are given, then compare one to the other, ignoring sasview.

Available models:
""")
    print_models()
226
def main():
    """
    Main program.

    Parses the command line (see :func:`print_usage` for the expected
    arguments), then runs :func:`compare_instance` for the requested
    model, or for every model if MODEL is "all".  Exits with status 1 on
    a bad argument list, printing the help or usage text.
    """
    if len(sys.argv) not in (6, 7):
        print_help()
        sys.exit(1)

    model = sys.argv[1]
    if model not in MODELS and model != "all":
        print('Bad model %s.  Use "all" or one of:'%model)
        print_models()
        sys.exit(1)
    try:
        count = int(sys.argv[2])
        is2D = sys.argv[3].startswith('2d')
        # Explicit check rather than assert so the validation survives
        # running under "python -O".
        if sys.argv[3][1] != 'd':
            raise ValueError("expected 1dNQ or 2dNQ for the point count")
        Nq = int(sys.argv[3][2:])
        mono = sys.argv[4] == 'mono'
        cutoff = float(sys.argv[4]) if not mono else 0
        base = sys.argv[5]
        comp = sys.argv[6] if len(sys.argv) > 6 else "sasview"
    except Exception:
        # Narrowed from a bare except so Ctrl-C is not reported as a
        # usage error; the traceback shows which argument was bad.
        traceback.print_exc()
        print_usage()
        sys.exit(1)

    data, index = make_data({'qmax':1.0, 'is2d':is2D, 'nq':Nq, 'res':0.,
                             'accuracy': 'Low', 'view':'log'})
    model_list = [model] if model != "all" else MODELS
    for model in model_list:
        compare_instance(model, data, index, N=count, mono=mono,
                         cutoff=cutoff, base=base, comp=comp)
260
if __name__ == "__main__":
    # NOTE(review): uncomment the next two lines to run with a fixed
    # random sequence — push_seed(1) presumably seeds the RNG for
    # reproducible comparisons; confirm in compare.py.
    #from .compare import push_seed
    #with push_seed(1): main()
    main()
Note: See TracBrowser for help on using the repository browser.