from types import MethodType
from collections import OrderedDict
from pyparsing import TokenConverter, ParseResults, originalTextFor
from rdflib import BNode, Variable, URIRef
# Development switch: change to True to get ``traceback`` imported for
# debugging sessions.  It is off by default.
DEBUG = False

if DEBUG:
    import traceback
"""
NOTE: PyParsing's setResultsName/__call__ provides a very similar solution to this.
I didn't realise this at the time of writing, and I will remove a
lot of this code at some point.
Utility classes for creating an abstract syntax tree with pyparsing actions.
Lets you label and group parts of parser production rules
For example:
# [5] BaseDecl ::= 'BASE' IRIREF
BaseDecl = Comp('Base', Keyword('BASE') + Param('iri',IRIREF))
After parsing, this gives you back a CompValue object,
which is a dict/object with the parameters specified.
So you can access the parameters as attributes or as keys:
baseDecl.iri
Comp lets you set an evalFn that is bound to the eval method of
the resulting CompValue
"""
# This is an alternative
# Comp('Sum')( Param('x')(Number) + '+' + Param('y')(Number) )
def value(ctx, val, variables=False, errors=False):
    """
    Utility function that resolves ``val`` against the context ``ctx``.

    * an ``Expr`` is evaluated with ``ctx``
    * any other ``CompValue`` cannot be resolved and raises ``Exception``
    * a ``list`` is resolved element by element
    * a ``BNode`` / ``Variable`` is looked up with ``ctx.get``
    * a ``ParseResults`` holding exactly one item is unwrapped and resolved
    * anything else is handed back unchanged

    Normally an unbound variable raises ``NotBoundError``;
    set variables=True to get the unbound variable itself back.

    Normally a ``SPARQLError`` found as the looked-up value is raised;
    set errors=True to have it returned instead.
    """
    # Expr must be tested before CompValue, since it is a subclass of it
    if isinstance(val, Expr):
        return val.eval(ctx)  # recurse?

    if isinstance(val, CompValue):
        raise Exception("What do I do with this CompValue? %s" % val)

    if isinstance(val, list):
        return [value(ctx, item, variables, errors) for item in val]

    if isinstance(val, (BNode, Variable)):
        bound = ctx.get(val)
        if not errors and isinstance(bound, SPARQLError):
            raise bound
        if bound is not None:
            return bound
        # not bound
        if not variables:
            raise NotBoundError
        return val

    if isinstance(val, ParseResults) and len(val) == 1:
        return value(ctx, val[0], variables, errors)

    return val
class ParamValue(object):
    """
    The outcome of parsing a single Param.

    It only records the parameter name, its token(s) and the isList
    flag; all cleverness is in the CompValue.
    """

    def __init__(self, name, tokenList, isList):
        self.isList = isList
        self.name = name
        # A list / ParseResults with exactly one entry is collapsed to
        # that entry; everything else is stored untouched.
        single = isinstance(tokenList, (list, ParseResults)) and len(tokenList) == 1
        self.tokenList = tokenList[0] if single else tokenList

    def __str__(self):
        return "Param(%s, %s)" % (self.name, self.tokenList)
class Param(TokenConverter):
    """
    A pyparsing token that labels a part of the parse-tree.

    When isList is true, repeated occurrences of the parameter have
    their values merged into a list.
    """

    def __init__(self, name, expr, isList=False):
        self.name = name
        self.isList = isList
        super(Param, self).__init__(expr)
        # Wrap whatever ``expr`` matched in a ParamValue
        self.addParseAction(self.postParse2)

    def postParse2(self, tokenList):
        """Parse action: package the matched tokens as a ParamValue."""
        return ParamValue(name=self.name, tokenList=tokenList, isList=self.isList)
class ParamList(Param):
    """
    Convenience spelling of ``Param(name, expr, isList=True)``.
    """

    def __init__(self, name, expr):
        super(ParamList, self).__init__(name, expr, isList=True)
class plist(list):
    """
    Marker type: behaves exactly like ``list``, but has a class of its
    own so that instances can be recognised by a type check.
    """
class CompValue(OrderedDict):
    """
    The result of parsing a Comp

    Any included Params are available as dict keys or as attributes.

    While a context is attached as ``self.ctx``, values read through
    ``[]``, attribute access or ``get`` are first resolved with
    ``value`` against that context; without one they are returned as
    stored.
    """

    def __init__(self, name, **values):
        """Create a CompValue labelled ``name`` that holds ``values``."""
        OrderedDict.__init__(self)
        self.name = name
        self.update(values)

    def clone(self):
        """Return a new CompValue built from this one's name and items."""
        return CompValue(self.name, **self)

    def __str__(self):
        return self.name + "_" + OrderedDict.__str__(self)

    def __repr__(self):
        return self.name + "_" + dict.__repr__(self)

    def _value(self, val, variables=False, errors=False):
        """
        Resolve ``val`` against ``self.ctx`` when a context is attached,
        otherwise return ``val`` unchanged.
        """
        # ``self.ctx`` reads as None unless it has been assigned: a
        # missing attribute falls through to __getattr__ below.
        if self.ctx is not None:
            # ``errors`` has to be forwarded together with ``variables``;
            # dropping it made get(..., errors=True) act like errors=False.
            return value(self.ctx, val, variables, errors)
        return val

    def __getitem__(self, a):
        return self._value(OrderedDict.__getitem__(self, a))

    def get(self, a, variables=False, errors=False):
        """
        Look up key ``a``; when the key is missing, ``a`` itself is used
        as the value.  ``variables`` and ``errors`` are passed on to
        ``value`` when a context is attached.
        """
        return self._value(OrderedDict.get(self, a, a), variables, errors)

    def __getattr__(self, a):
        # Hack hack: OrderedDict relies on this
        if a in ('_OrderedDict__root', '_OrderedDict__end'):
            raise AttributeError
        try:
            return self[a]
        except KeyError:
            # unknown names read as None instead of raising AttributeError
            return None
class Expr(CompValue):
    """
    A CompValue that can be evaluated.
    """

    def __init__(self, name, evalfn=None, **values):
        super(Expr, self).__init__(name, **values)
        # Bind the evaluation function to this instance so that it is
        # called like a method (it receives the Expr as first argument).
        self._evalfn = MethodType(evalfn, self) if evalfn else None

    def eval(self, ctx={}):
        """
        Run the bound evaluation function with ``ctx``.

        A SPARQLError raised during evaluation is returned rather than
        propagated.  ``ctx`` is attached as ``self.ctx`` only for the
        duration of the call.
        """
        self.ctx = ctx
        try:
            return self._evalfn(ctx)
        except SPARQLError as err:
            return err
        finally:
            self.ctx = None
class Comp(TokenConverter):
    """
    A pyparsing token that groups things together under a label.

    Any sub-tokens that are not Params will be ignored.
    Returns CompValue / Expr objects - depending on whether evalFn is set.
    """

    def __init__(self, name, expr):
        self.expr = expr
        TokenConverter.__init__(self, expr)
        self.name = name
        self.evalfn = None

    def postParse(self, instring, loc, tokenList):
        """Collect the ParamValues in ``tokenList`` into one result object."""
        if self.evalfn:
            # Expr binds the evaluation function to the new instance
            res = Expr(self.name, self.evalfn)
        else:
            res = CompValue(self.name)
            if self.name == 'ServiceGraphPattern':
                # Then this must be a service graph pattern and have
                # already matched.
                # lets assume there is one, for now, then test for two later.
                res['service_string'] = (
                    originalTextFor(self.expr).searchString(instring)[0][0]
                )

        for tok in tokenList:
            if not isinstance(tok, ParamValue):
                # anything that is not a Param is dropped
                continue
            if not tok.isList:
                res[tok.name] = tok.tokenList
                continue
            # list-valued params accumulate every occurrence in a plist
            if tok.name not in res:
                res[tok.name] = plist()
            res[tok.name].append(tok.tokenList)
        return res

    def setEvalFn(self, evalfn):
        """Set the evaluation function and return ``self`` for chaining."""
        self.evalfn = evalfn
        return self
def prettify_parsetree(t, indent='', depth=0):
    """
    Render a parse tree as an indented, multi-line string.

    ``indent`` is put in front of every line and ``depth`` controls how
    many spaces follow it.  ParseResults, CompValue, dict and list
    nodes are walked recursively; any other value is printed with its
    ``repr``.
    """
    pieces = []
    if isinstance(t, ParseResults):
        pieces.extend(
            prettify_parsetree(child, indent, depth + 1) for child in t.asList()
        )
        for key, val in sorted(t.items()):
            pieces.append("%s%s- %s:\n" % (indent, ' ' * depth, key))
            pieces.append(prettify_parsetree(val, indent, depth + 1))
    elif isinstance(t, dict):
        # A CompValue is a dict with one extra header line for its name
        if isinstance(t, CompValue):
            pieces.append("%s%s> %s:\n" % (indent, ' ' * depth, t.name))
        for key, val in t.items():
            pieces.append("%s%s- %s:\n" % (indent, ' ' * (depth + 1), key))
            pieces.append(prettify_parsetree(val, indent, depth + 2))
    elif isinstance(t, list):
        pieces.extend(prettify_parsetree(child, indent, depth + 1) for child in t)
    else:
        pieces.append("%s%s- %r\n" % (indent, ' ' * depth, t))
    return "".join(pieces)
if __name__ == '__main__':
    import sys

    from pyparsing import Word, nums

    # Small demo grammar: "<int> + <int>", evaluated by adding both sides.
    Number = Word(nums)
    Number.setParseAction(lambda toks: int(toks[0]))
    Plus = Comp('plus', Param('a', Number) + '+' + Param('b', Number))
    Plus.setEvalFn(lambda self, ctx: self.a + self.b)

    # The expression to parse is taken from the first command-line argument
    parsed = Plus.parseString(sys.argv[1])
    print(parsed)
    print(parsed[0].eval({}))
# hurrah for circular imports
from rdflib.plugins.sparql.sparql import SPARQLError, NotBoundError