"""
A macro mechanism primarily for string replacement in resource descriptors.
"""
#c Copyright 2008-2023, the GAVO project <gavo@ari.uni-heidelberg.de>
#c
#c This program is free software, covered by the GNU GPL. See the
#c COPYING file in the source distribution.
import datetime
import re
import urllib.request, urllib.parse, urllib.error
from gavo import utils
from gavo.base import attrdef
from gavo.base import common
from gavo.base import complexattrs
from gavo.base import config
from gavo.base import meta
from gavo.base import osinter
from gavo.base import structure
from gavo.utils.parsetricks import (
ZeroOrMore, Forward,
Regex, Suppress,
Literal, pyparsingWhitechars)
class MacroError(common.StructureError):
    """is the exception signalling a failure during macro expansion.

    Construct it with the error message and the name of the macro
    concerned; a hint and a position may be passed in addition.
    """

    def __init__(self, message, macroName, hint=None, pos=None):
        # The base class gets a generic "<name> failed" text; the
        # detailed message is kept on the instance and used by __str__.
        failureTitle = macroName+" failed"
        common.StructureError.__init__(
            self, failureTitle, hint=hint, pos=pos)
        self.args = [message, macroName, hint, pos]
        self.macroName = macroName
        self.message = message

    def __str__(self):
        template = "Error during macro expansion: %s"
        return template%self.message
class MacroExpander(object):
    """is a generic "macro" expander for scripts of all kinds.

    The design is loosely modelled on TeX, though it is far simpler; the
    syntax is described below.

    Macro implementations are supplied by a MacroPackage object.  Several
    of those exist, offering different functionality depending on the
    script context (i.e., whether it belongs to an RD, a DD, or a Table).

    Every macro is a function that takes strings and returns a string.
    Arguments are written as {arg1}{arg2}; curly braces within them can
    be escaped with a backslash.  No whitespace is allowed between a macro
    and its first argument.

    To glue a macro expansion to text immediately following it, use the
    glue sequence \\+

    The main entry point is the expand method, which takes a string that
    may contain macro calls and returns a string.

    Building a macro expander is relatively expensive, so caching them
    pays off.  MacroPackage has a getExpander method that does this
    caching for you.
    """

    def __init__(self, package):
        self.package = package
        self._macroGrammar = self._getMacroGrammar()

    def _execMacro(self, s, loc, toks):
        """is the parse action for a macro call: the first token is the
        macro name, the remaining ones are its arguments.
        """
        tokens = toks.asList()
        return self.package.execMacro(tokens[0], tokens[1:])

    def expand(self, aString):
        """returns aString run through the macro grammar.
        """
        grammar = self._macroGrammar
        return utils.pyparseTransform(grammar, aString)

    def _getMacroGrammar(self, debug=False):
        """returns the grammar matching macro calls and the special
        backslash sequences.

        debug is not used in this method.
        """
        with pyparsingWhitechars(" \t"):
            # Forward declaration: macro calls may appear inside
            # macro arguments.
            macroCall = Forward()

            # what can appear inside a {...} argument
            escapedBrace = (
                Literal("\\{").addParseAction(lambda *args: "{")
                | Literal("\\}").addParseAction(lambda *args: "}"))
            plainText = Regex(r"[^}\\]+").leaveWhitespace()
            argPart = macroCall | escapedBrace | plainText

            # a single argument collapses into one string
            oneArg = Suppress("{") + ZeroOrMore(argPart) + Suppress("}")
            oneArg.addParseAction(lambda s, pos, toks: "".join(toks))

            argList = ZeroOrMore(oneArg)
            argList.setWhitespaceChars("")

            identifier = Regex("[A-Za-z_][A-Za-z_0-9]+")
            identifier.setWhitespaceChars("")

            macroCall << Suppress("\\") + identifier + argList
            macroCall.addParseAction(self._execMacro)

            # special sequences that are not macro calls
            escapedBackslash = Literal("\\\\")
            escapedBackslash.addParseAction(lambda *args: "\\")

            continuedLine = Literal("\\\n")
            continuedLine.addParseAction(lambda *args: " ")

            glueSequence = Literal("\\+")
            glueSequence.addParseAction(lambda *args: "")

            return (escapedBackslash | continuedLine
                | glueSequence | macroCall)
class ExpansionDelegator(object):
    """A mixin for classes that leave macro expansion entirely to their
    parent.

    It is meant for base.Structures having a parent attribute; with this
    mixed in, expand calls are passed on to that parent.
    """

    def expand(self, aString):
        """returns whatever the parent's expand makes of aString.
        """
        delegate = self.parent
        return delegate.expand(aString)
class MacroPackage(common.StructCallbacks):
    r"""is a function dispatcher for MacroExpander.

    Basically, you inherit from this class and define macro_xxx functions.
    MacroExpander can then call \xxx, possibly with arguments.
    """

    def __findMacro(self, macName):
        """returns the callable implementing the macro macName.

        The macro is looked up as a macro_<macName> attribute on self and,
        if self has an rd attribute, on that as well.  A MacroError is
        raised when neither yields anything.
        """
        fun = getattr(self, "macro_"+macName, None)
        if fun is not None:
            return fun

        # this is a bit of a hack so subordinate objects see macDefs from
        # their RDs; generally, we don't inherit macros, as they are bound
        # to types in DaCHS.
        if hasattr(self, "rd"):
            fun = getattr(self.rd, "macro_"+macName, None)
            if fun is not None:
                return fun

        raise MacroError(
            "No macro \\%s available in a %s context"%(
                macName, self.__class__.__name__),
            macName, hint="%s objects have the following macros: %s."%(
                self.__class__.__name__, ", ".join(self.listMacros())))

    def listMacros(self):
        """returns the names (without the macro_ prefix) of the macros
        defined on self.
        """
        return [n[6:] for n in dir(self) if n.startswith("macro_")]

    def execMacro(self, macName, args):
        """returns the result of calling the macro macName with the
        sequence of arguments args.

        A MacroError is raised if the macro does not exist, if args does
        not fit the macro's signature, or if the macro raises anything
        that is not a utils.Error; utils.Error instances are re-raised
        unchanged.
        """
        # local import so this class does not depend on the module's
        # import block
        import inspect

        fun = self.__findMacro(macName)

        # Check the arguments against the signature before calling.  This
        # way, a TypeError raised inside the macro body is not mistaken
        # for a wrong number of arguments.
        try:
            inspect.signature(fun).bind(*args)
        except TypeError:
            raise utils.logOldExc(MacroError(
                "Invalid macro arguments to \\%s: %s"%(macName, args), macName,
                hint="You supplied too few or too many arguments"))
        except ValueError:
            # no introspectable signature; let the call itself decide
            pass

        try:
            return fun(*args)
        except utils.Error:
            raise
        except Exception as msg:
            argRepr = "}{".join(utils.safe_str(a) for a in args)
            if argRepr:
                argRepr = "{%s}"%argRepr
            raise utils.logOldExc(MacroError(
                "While expanding macro \\%s%s: %s"%(macName, argRepr, msg),
                macName,
                hint="This means that the code dealing with your arguments"
                " was throroughly confused by what you passed.  If you really"
                " cannot see why it was, file a bug."))

    def getExpander(self):
        """returns a MacroExpander for self, creating it on first use and
        keeping it on the instance afterwards.
        """
        try:
            return self.__macroExpander
        except AttributeError:
            self.__macroExpander = MacroExpander(self)
            return self.getExpander()

    def expand(self, stuff):
        """returns stuff as processed by self's macro expander.
        """
        return self.getExpander().expand(stuff)

    def macro_quote(self, arg):
        """returns the argument in quotes (with internal quotes backslash-escaped
        if necessary).
        """
        return '"%s"'%(arg.replace('"', '\\"'))

    def macro_sqlquote(self, arg):
        """returns the argument as a quoted string, unless it is 'NULL' or
        None, in which case just NULL is returned.
        """
        if arg is None or arg=='NULL':
            return "NULL"
        return "'%s'"%arg.replace("'", "''")

    def macro_sql_standardPubDID(self, fromCol="accref"):
        """returns a SQL expression returning a DaCHS standard pubDID generated
        from the accref (or something overridden) column.

        This is convenient in obscore or ssa views when the underlying table
        just has accrefs.  If your code actually uses the pubDID to search
        in the table (and it probably shouldn't), better use an actual column
        and index it.
        """
        auth = config.get("ivoa", "authority")
        return "'ivo://%s/~?' || gavo_urlescape(%s)"%(
            auth.replace("'", "''"),
            fromCol)

    def macro_reSub(self, pattern, replacement, string):
        """returns the string with the python RE pattern replaced with
        replacement.

        This is directly handed through to python re.sub, so you can (but
        probably shouldn't) play all the RE tricks you can in python (e.g.,
        back references).

        If you find yourself having to use reSub, you should regard that as
        an alarm sign that you're probably doing it wrong.

        Oh: closing curly braces can be included in the argument by
        backslash-escaping them.
        """
        return re.sub(pattern, replacement, string)
class StandardMacroMixin(MacroPackage):
    """is a mixin providing some macros for scripting's MacroExpander.

    The class mixing in needs to provide its resource descriptor in the
    rd attribute.
    """

    def macro_magicEmpty(self, val):
        """returns __EMPTY__ if val is empty.

        This is necessary when feeding possibly empty params from mixin
        parameters (don't worry if you don't understand this).
        """
        if val:
            return val
        else:
            return "__EMPTY__"

    def macro_rdId(self):
        """the identifier of the current resource descriptor.
        """
        return self.rd.sourceId

    def macro_rdIdDotted(self):
        """the identifier for the current resource descriptor with slashes replaced
        with dots (so they work as the "host part" in URIs).
        """
        return self.rd.sourceId.replace("/", ".")

    def macro_schema(self):
        """the schema of the current resource descriptor.
        """
        return self.rd.schema

    def macro_resdir(self):
        """the input-relative resource directory of the current resource
        descriptor.

        This never has a trailing slash.
        """
        return self.rd.getRelResdir().rstrip("/")

    def macro_RSTservicelink(self, serviceId, title=None):
        """a link to an internal service; id is <rdId>/<serviceId>/<renderer>,
        title, if given, is the anchor text.

        The result is a link in the short form for restructured text.
        """
        if title is None:
            title = serviceId
        return "`%s <%s>`_"%(title, osinter.makeSitePath(serviceId))

    def macro_RSTtable(self, tableName):
        """adds a reStructured text link to a tableName pointing to its table
        info.
        """
        return "`%s <%s>`_"%(tableName,
            osinter.makeSitePath("tableinfo/%s"%tableName))

    def macro_internallink(self, relPath):
        """an absolute URL from a path relative to the DC root.
        """
        return osinter.makeAbsoluteURL(relPath, canonical=True)

    def macro_urlquote(self, string):
        """wraps urllib.parse.quote.
        """
        return urllib.parse.quote(string)

    def macro_today(self):
        """today's date in ISO representation.
        """
        return str(datetime.date.today())

    def macro_getConfig(self, section, name=None):
        """the current value of configuration item {section}{name}.

        You can also only give one argument to access settings from the
        general section.
        """
        if name is None:
            # single-argument form: the argument is the item name
            section, name = "general", section
        val = config.get(section, name)
        if isinstance(val, str):
            return val
        else:
            return str(val)

    def macro_upper(self, aString):
        """returns aString uppercased.

        There's no guarantees for characters outside ASCII.
        """
        return aString.upper()

    def macro_lower(self, aString):
        """returns aString lowercased.

        There's no guarantees for characters outside ASCII.
        """
        return aString.lower()

    def macro_decapitalize(self, aString):
        """returns aString with the first character lowercased.

        An empty aString is returned unchanged.
        """
        if not aString:
            # macros have to return strings; without this guard, the
            # empty string would yield None.
            return aString
        return aString[0].lower()+aString[1:]

    def macro_test(self, *args):
        """always "test macro expansion".
        """
        return "test macro expansion"
class MacDef(structure.Structure):
    """A macro definition within an RD.

    The macro becomes available on the parent, and the replacement text
    is macro-expanded within the parent (behaviour is undefined if you try
    a recursive expansion).
    """
    name_ = "macDef"

    _name = attrdef.UnicodeAttribute(
        "name",
        default=utils.Undefined,
        description="Name the macro will be available as",
        copyable=True)
    _content = structure.DataContent(
        description="Replacement text of the macro")

    def validate(self):
        """raises a LiteralParseError for names shorter than two
        characters.
        """
        super().validate()
        if len(self.name)>=2:
            return
        raise common.LiteralParseError("name", self.name,
            hint="Macro names must have at least two characters.")

    def onElementComplete(self):
        """expands the content within the parent and installs the macro
        as macro_<name> on the parent.
        """
        super().onElementComplete()
        owner = self.parent
        self.content_ = owner.expand(self.content_)

        # the macro reads content_ at call time rather than capturing
        # the value computed above.
        def mac():
            return self.content_

        setattr(owner, "macro_"+self.name, mac)
def MacDefAttribute(**kwargs):
    """returns a StructListAttribute named macDefs that has MacDef as
    its child factory; keyword arguments are passed through.
    """
    makeAttribute = complexattrs.StructListAttribute
    return makeAttribute("macDefs", childFactory=MacDef, **kwargs)