expression.py @ b9d74f3

Last change on this file since b9d74f3 was b9d74f3, checked in by andyfaff, 8 years ago
MAINT: use raise Exception() not raise Exception
Property mode set to `100644`
File size: 13.6 KB

Rev	Line
[4e9f227]	1	# This program is public domain
	2	"""
	3	Parameter expression evaluator.
	4
	5	For systems in which constraints are expressed as string expressions rather
	6	than python code, :func:`compile_constraints` can construct an expression
	7	evaluator that substitutes the computed values of the expressions into the
	8	parameters.
	9
	10	The compiler requires a symbol table, an expression set and a context.
	11	The symbol table maps strings containing fully qualified names such as
	12	'M1.c[3].full_width' to parameter objects with a 'value' property that
	13	can be queried and set. The expression set maps symbol names from the
	14	symbol table to string expressions. The context provides additional symbols
	15	for the expressions in addition to the usual mathematical functions and
	16	constants.
	17
	18	The expressions are compiled and interpreted by python, with only minimal
	19	effort to make sure that they don't contain bad code. The resulting
	20	constraints function returns 0 so it can be used directly in a fit problem
	21	definition.
	22
	23	Extracting the symbol table from the model depends on the structure of the
	24	model. If fitness.parameters() is set correctly, then this should simply
	25	be a matter of walking the parameter data, remembering the path to each
	26	parameter in the symbol table. For compactness, dictionary elements should
	27	be referenced by .name rather than ["name"]. Model name can be used as the
	28	top level.
	29
	30	Getting the parameter expressions applied correctly is challenging.
	31	The following monkey patch works by overriding model_update in FitProblem
	32	so that after setp(p) is called and, the constraints expression can be
	33	applied before telling the underlying fitness function that the model
	34	is out of date::
	35
	36	# Override model update so that parameter constraints are applied
	37	problem._model_update = problem.model_update
	38	def model_update():
	39	constraints()
	40	problem._model_update()
	41	problem.model_update = model_update
	42
	43	Ideally, this interface will change
	44	"""
	45	import math
	46	import re
	47
	48	# simple pattern which matches symbols. Note that it will also match
	49	# invalid substrings such as a3...9, but given syntactically correct
	50	# input it will only match symbols.
	51	_symbol_pattern = re.compile('([a-zA-Z_][a-zA-Z_0-9.]*)')
	52
	53	def _symbols(expr,symtab):
	54	"""
	55	Given an expression string and a symbol table, return the set of symbols
	56	used in the expression. Symbols are only returned once even if they
	57	occur multiple times. The return value is a set with the elements in
	58	no particular order.
	59
	60	This is the first step in computing a dependency graph.
	61	"""
	62	matches = [m.group(0) for m in _symbol_pattern.finditer(expr)]
	63	return set([symtab[m] for m in matches if m in symtab])
	64
	65	def _substitute(expr,mapping):
	66	"""
	67	Replace all occurrences of symbol s with mapping[s] for s in mapping.
	68	"""
	69	# Find the symbols and the mapping
	70	matches = [(m.start(),m.end(),mapping[m.group(1)])
	71	for m in _symbol_pattern.finditer(expr)
	72	if m.group(1) in mapping]
	73
	74	# Split the expression in to pieces, with new symbols replacing old
	75	pieces = []
	76	offset = 0
	77	for start,end,text in matches:
	78	pieces += [expr[offset:start],text]
	79	offset = end
	80	pieces.append(expr[offset:])
	81
	82	# Join the pieces and return them
	83	return "".join(pieces)
	84
	85	def _find_dependencies(symtab, exprs):
	86	"""
	87	Returns a list of pair-wise dependencies from the parameter expressions.
	88
	89	For example, if p3 = p1+p2, then find_dependencies([p1,p2,p3]) will
	90	return [(p3,p1),(p3,p2)]. For base expressions without dependencies,
	91	such as p4 = 2*pi, this should return [(p4, None)]
	92	"""
	93	deps = [(target,source)
	94	for target,expr in exprs.items()
	95	for source in _symbols_or_none(expr,symtab)]
	96	return deps
	97
	98	# Hack to deal with expressions without dependencies --- return a fake
	99	# dependency of None.
	100	# The better solution is fix order_dependencies so that it takes a
	101	# dictionary of {symbol: dependency_list}, for which no dependencies
	102	# is simply []; fix in parameter_mapping as well
	103	def _symbols_or_none(expr,symtab):
	104	syms = _symbols(expr,symtab)
	105	return syms if len(syms) else [None]
	106
	107	def _parameter_mapping(pairs):
	108	"""
	109	Find the parameter substitution we need so that expressions can
	110	be evaluated without having to traverse a chain of
	111	model.layer.parameter.value
	112	"""
	113	left,right = zip(*pairs)
	114	pars = list(sorted(p for p in set(left+right) if p is not None))
	115	definition = dict( ('P%d'%i,p) for i,p in enumerate(pars) )
	116	# p is None when there is an expression with no dependencies
	117	substitution = dict( (p,'P%d.value'%i)
	118	for i,p in enumerate(sorted(pars))
	119	if p is not None)
	120	return definition, substitution
	121
	122	def no_constraints():
	123	"""
	124	This parameter set has no constraints between the parameters.
	125	"""
	126	pass
	127
	128	def compile_constraints(symtab, exprs, context={}):
	129	"""
	130	Build and return a function to evaluate all parameter expressions in
	131	the proper order.
	132
	133	Input:
	134
	135	symtab is the symbol table for the model: { 'name': parameter }
	136
	137	exprs is the set of computed symbols: { 'name': 'expression' }
	138
	139	context is any additional context needed to evaluate the expression
	140
	141	Return:
	142
	143	updater function which sets parameter.value for each expression
	144
	145	Raises:
	146
	147	AssertionError - model, parameter or function is missing
	148
	149	SyntaxError - improper expression syntax
	150
	151	ValueError - expressions have circular dependencies
	152
	153	This function is not terribly sophisticated, and it would be easy to
	154	trick. However it handles the common cases cleanly and generates
	155	reasonable messages for the common errors.
	156
	157	This code has not been fully audited for security. While we have
	158	removed the builtins and the ability to import modules, there may
	159	be other vectors for users to perform more than simple function
	160	evaluations. Unauthenticated users should not be running this code.
	161
	162	Parameter names are assumed to contain only _.a-zA-Z0-9#[]
	163
	164	Both names are provided for inverse functions, e.g., acos and arccos.
	165
	166	Should try running the function to identify syntax errors before
	167	running it in a fit.
	168
	169	Use help(fn) to see the code generated for the returned function fn.
	170	dis.dis(fn) will show the corresponding python vm instructions.
	171	"""
	172
	173	# Sort the parameters in the order they need to be evaluated
	174	deps = _find_dependencies(symtab, exprs)
	175	if deps == []: return no_constraints
	176	order = order_dependencies(deps)
	177
	178
	179	# Rather than using the full path to the parameters in the parameter
	180	# expressions, instead use Pn, and substitute Pn.value for each occurrence
	181	# of the parameter in the expression.
	182	names = list(sorted(symtab.keys()))
	183	parameters = dict(('P%d'%i, symtab[k]) for i,k in enumerate(names))
	184	mapping = dict((k, 'P%d.value'%i) for i,k in enumerate(names))
	185
	186
	187	# Initialize dictionary with available functions
	188	globals = {}
	189	globals.update(math.__dict__)
	190	globals.update(dict(arcsin=math.asin,arccos=math.acos,
	191	arctan=math.atan,arctan2=math.atan2))
	192	globals.update(context)
	193	globals.update(parameters)
	194	globals['id'] = id
	195	locals = {}
	196
	197	# Define the constraints function
	198	assignments = ["=".join((p,exprs[p])) for p in order]
	199	code = [_substitute(s, mapping) for s in assignments]
	200	functiondef = """
	201	def eval_expressions():
	202	'''
	203	%s
	204	'''
	205	%s
	206	return 0
	207	"""%("\n ".join(assignments),"\n ".join(code))
	208
	209	#print("Function: "+functiondef)
	210	exec functiondef in globals,locals
	211	retfn = locals['eval_expressions']
	212
	213	# Remove garbage added to globals by exec
	214	globals.pop('__doc__',None)
	215	globals.pop('__name__',None)
	216	globals.pop('__file__',None)
	217	globals.pop('__builtins__')
	218	#print globals.keys()
	219
	220	return retfn
	221
	222	def order_dependencies(pairs):
	223	"""
	224	Order elements from pairs so that b comes before a in the
	225	ordered list for all pairs (a,b).
	226	"""
	227	#print "order_dependencies",pairs
	228	emptyset = set()
	229	order = []
	230
	231	# Break pairs into left set and right set
	232	left,right = [set(s) for s in zip(*pairs)] if pairs != [] else ([],[])
	233	while pairs != []:
	234	#print "within",pairs
	235	# Find which items only occur on the right
	236	independent = right - left
	237	if independent == emptyset:
	238	cycleset = ", ".join(str(s) for s in left)
[b9d74f3]	239	raise ValueError("Cyclic dependencies amongst %s"%cycleset)
[4e9f227]	240
	241	# The possibly resolvable items are those that depend on the independents
	242	dependent = set([a for a,b in pairs if b in independent])
	243	pairs = [(a,b) for a,b in pairs if b not in independent]
	244	if pairs == []:
	245	resolved = dependent
	246	else:
	247	left,right = [set(s) for s in zip(*pairs)]
	248	resolved = dependent - left
	249	#print "independent",independent,"dependent",dependent,"resolvable",resolved
	250	order += resolved
	251	#print "new order",order
	252	order.reverse()
	253	return order
	254
	255	# ========= Test code ========
	256	def _check(msg,pairs):
	257	"""
	258	Verify that the list n contains the given items, and that the list
	259	satisfies the partial ordering given by the pairs in partial order.
	260	"""
	261	left,right = zip(*pairs) if pairs != [] else ([],[])
	262	items = set(left)
	263	n = order_dependencies(pairs)
	264	if set(n) != items or len(n) != len(items):
	265	n.sort()
	266	items = list(items); items.sort()
[b9d74f3]	267	raise Exception("%s expect %s to contain %s for %s"%(msg,n,items,pairs))
[4e9f227]	268	for lo,hi in pairs:
	269	if lo in n and hi in n and n.index(lo) >= n.index(hi):
[b9d74f3]	270	raise Exception("%s expect %s before %s in %s for %s"%(msg,lo,hi,n,pairs))
[4e9f227]	271
	272	def test_deps():
[9a5097c]	273	import numpy as np
[4e9f227]	274
	275	# Null case
	276	_check("test empty",[])
	277
	278	# Some dependencies
	279	_check("test1",[(2,7),(1,5),(1,4),(2,1),(3,1),(5,6)])
	280	_check("test1 renumbered",[(6,1),(7,3),(7,4),(6,7),(5,7),(3,2)])
[9a5097c]	281	_check("test1 numpy",np.array([(2,7),(1,5),(1,4),(2,1),(3,1),(5,6)]))
[4e9f227]	282
	283	# No dependencies
	284	_check("test2",[(4,1),(3,2),(8,4)])
	285
	286	# Cycle test
	287	pairs = [(1,4),(4,3),(4,5),(5,1)]
	288	try: n = order_dependencies(pairs)
	289	except ValueError: pass
[b9d74f3]	290	else: raise Exception("test3 expect ValueError exception for %s"%(pairs,))
[4e9f227]	291
	292	# large test for gross speed check
[9a5097c]	293	A = np.random.randint(4000,size=(1000,2))
[4e9f227]	294	A[:,1] += 4000 # Avoid cycles
	295	_check("test-large",A)
	296
	297	# depth tests
	298	k = 200
[9a5097c]	299	A = np.array([range(0,k),range(1,k+1)]).T
[4e9f227]	300	_check("depth-1",A)
	301
[9a5097c]	302	A = np.array([range(1,k+1),range(0,k)]).T
[4e9f227]	303	_check("depth-2",A)
	304
	305	def test_expr():
	306	import inspect, dis
	307	import math
	308
	309	symtab = {'a.b.x':1, 'a.c':2, 'a.b':3, 'b.x':4}
	310	expr = 'a.b.x + sin(4pia.c) + a.b.x/a.b'
	311
	312	# Check symbol lookup
	313	assert _symbols(expr, symtab) == set([1,2,3])
	314
	315	# Check symbol rename
	316	assert _substitute(expr,{'a.b.x':'Q'}) == 'Q + sin(4pia.c) + Q/a.b'
	317	assert _substitute(expr,{'a.b':'Q'}) == 'a.b.x + sin(4pia.c) + a.b.x/Q'
	318
	319
	320	# Check dependency builder
	321	# Fake parameter class
	322	class Parameter:
	323	def __init__(self, name, value=0, expression=''):
	324	self.path = name
	325	self.value = value
	326	self.expression = expression
	327	def iscomputed(self): return (self.expression != '')
	328	def __repr__(self): return self.path
	329	def world(*pars):
	330	symtab = dict((p.path,p) for p in pars)
	331	exprs = dict((p.path,p.expression) for p in pars if p.iscomputed())
	332	return symtab, exprs
	333	p1 = Parameter('G0.sigma',5)
	334	p2 = Parameter('other',expression='2pisin(G0.sigma/.1875) + M1.G1')
	335	p3 = Parameter('M1.G1',6)
	336	p4 = Parameter('constant',expression='2pi35')
	337	# Simple chain
	338	assert set(_find_dependencies(*world(p1,p2,p3))) == set([(p2.path,p1),(p2.path,p3)])
	339	# Constant expression
	340	assert set(_find_dependencies(*world(p1,p4))) == set([(p4.path,None)])
	341	# No dependencies
	342	assert set(_find_dependencies(*world(p1,p3))) == set([])
	343
	344	# Check function builder
	345	fn = compile_constraints(*world(p1,p2,p3))
	346
	347	# Inspect the resulting function
	348	if 0:
	349	print(inspect.getdoc(fn))
	350	print(dis.dis(fn))
	351
	352	# Evaluate the function and see if it updates the
	353	# target value as expected
	354	fn()
	355	expected = 2math.pimath.sin(5/.1875) + 6
	356	assert p2.value == expected,"Value was %s, not %s"%(p2.value,expected)
	357
	358	# Check empty dependency set doesn't crash
	359	fn = compile_constraints(*world(p1,p3))
	360	fn()
	361
	362	# Check that constants are evaluated properly
	363	fn = compile_constraints(*world(p4))
	364	fn()
	365	assert p4.value == 2math.pi35
	366
	367	# Check additional context example; this also tests multiple
	368	# expressions
	369	class Table:
	370	Si = 2.09
	371	values = {'Si': 2.07}
	372	tbl = Table()
	373	p5 = Parameter('lookup',expression="tbl.Si")
	374	fn = compile_constraints(*world(p1,p2,p3,p5),context=dict(tbl=tbl))
	375	fn()
	376	assert p5.value == 2.09,"Value for %s was %s"%(p5.expression,p5.value)
	377	p5.expression = "tbl.values['Si']"
	378	fn = compile_constraints(*world(p1,p2,p3,p5),context=dict(tbl=tbl))
	379	fn()
	380	assert p5.value == 2.07,"Value for %s was %s"%(p5.expression,p5.value)
	381
	382
	383	# Verify that we capture invalid expressions
	384	for expr in ['G4.cage', 'M0.cage', 'M1.G1 + *2',
	385	'piddle',
	386	'5; import sys; print "p0wned"',
	387	'__import__("sys").argv']:
	388	try:
	389	p6 = Parameter('broken',expression=expr)
	390	fn = compile_constraints(*world(p6))
	391	fn()
	392	except Exception as msg:
	393	#print(msg)
	394	pass
	395	else:
	396	raise "Failed to raise error for %s"%expr
	397
	398	if __name__ == "__main__":
	399	test_expr()
	400	test_deps()

Note: See TracBrowser for help on using the repository browser.

SasView

source: sasview/src/sas/sascalc/fit/expression.py @ b9d74f3

Download in other formats: