Source code for pysys.config.descriptor

#!/usr/bin/env python
# PySys System Test Framework, Copyright (C) 2006-2022 M.B. Grieve

# This library is free software; you can redistribute it and/or
# modify it under the terms of the GNU Lesser General Public
# License as published by the Free Software Foundation; either
# version 2.1 of the License, or (at your option) any later version.

# This library is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
# Lesser General Public License for more details.

# You should have received a copy of the GNU Lesser General Public
# License along with this library; if not, write to the Free Software
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

"""
The `TestDescriptor <pysys.config.descriptor.TestDescriptor>` class holds metadata for each testcase 
(``pysystest.*``) or directory (``pysysdirconfig.xml``), and the `DescriptorLoader <pysys.config.descriptor.DescriptorLoader>` 
class allows customization of the test discovery process. 
"""

from __future__ import print_function
import os.path, logging, xml.dom.minidom
import collections
import copy
import locale
import inspect
import importlib
import time

import pysys
from pysys.constants import *
from pysys.exceptions import UserError
from pysys.utils.fileutils import toLongPathSafe, fromLongPathSafe, pathexists
from pysys.utils.pycompat import isstring

log = logging.getLogger('pysys.config.descriptor')

[docs]class TestDescriptor(object): """Descriptor metadata for an individual testcase (``pysystest.*``) or defaults for tests under a directory subtree (``pysysdirconfig.xml``); see :doc:`/pysys/TestDescriptors`. The `DescriptorLoader` class is responsible for determining the available descriptor instances. :ivar str ~.file: The absolute path of the testcase descriptor file. :ivar str ~.testDir: The absolute path of the test, which is used to convert any relative paths into absolute paths. :ivar str ~.id: The testcase identifier, or the id prefix if this is a directory config descriptor rather than a testcase descriptor. Includes a mode suffix if this is a multi-mode test. :ivar str ~.idWithoutMode: The raw testcase identifier with no mode suffix. :ivar str ~.type: The kind of test this is (``auto`` or ``manual``) :ivar str ~.skippedReason: If set to a non-empty string, indicates that this testcase is skipped and provides the reason. If this is set then the test is skipped regardless of the value of `state`. :ivar str ~.state: The state of the testcase (runnable, deprecated or skipped). This field is deprecated - we recommend using `skippedReason` instead, which provides a descriptive outcome to explain why. :ivar str ~.title: The one-line title summarizing this testcase. :ivar str ~.purpose: A detailed description of the purpose of the testcase. :ivar list[str] ~.groups: A list of the user defined groups the testcase belongs to. :ivar list[TestMode] ~.modes: A list of the user defined modes the testcase can be run in. :ivar TestMode ~.mode: Specifies which of the possible modes this descriptor represents or None if the the descriptor has no modes. This field is only present after the raw descriptors have been expanded into multiple mode-specific descriptors. Note that after a descriptor is created from the on-disk file, the `mode` attribute is not set until the later phase when multi-mode descriptors are cloned and expanded based on the selected modes. You can use ``descriptor.mode.params`` to get the parameter dictionary for this mode, and ``descriptor.mode.isPrimary`` to find out of this is a primary mode. :ivar str ~.classname: The Python classname to be executed for this testcase. :ivar str ~.module: The path to the python module containing the testcase class. Relative to testDir, or an absolute path. If not set, the class is looked up in the PYTHONPATH. :ivar str ~.input: The path to the input directory of the testcase. Relative to testDir, or an absolute path. :ivar str ~.output: The path to the output parent directory of the testcase. Relative to testDir, or an absolute path. :ivar str ~.reference: The path to the reference directory of the testcase. Relative to testDir, or an absolute path. :ivar list ~.traceability: A list of the requirements covered by the testcase, typically keywords or bug/story ids. :ivar list[str] ~.authors: A list of the names or user ids of people who contributed to the test. :ivar str ~.created: The date when the test was created in yyyy-mm-dd format. :ivar float ~.executionOrderHint: A float priority value used to determine the order in which testcases will be run; higher values are executed before low values. The default is 0.0. :ivar bool ~.isDirConfig: True if this is a directory configuration, or False if it's a normal testcase. :ivar dict[str,obj] ~.userData: A Python dictionary that can be used for storing user-defined data in the descriptor. In a pysystest.py, this can be populated by a ``__pysys_user_data__`` dictionary, e.g. ``__pysys_user_data__ = {"key": "val ${projectProperty}"}`` or ``__pysys_user_data.key__ = "val"``. """ __slots__ = 'isDirConfig', 'file', 'testDir', 'id', 'type', 'state', 'title', 'purpose', 'groups', 'modes', 'mode', \ 'classname', 'module', 'input', 'output', 'reference', 'traceability', 'executionOrderHint', 'executionOrderHintsByMode', \ 'authors', 'created', \ 'skippedReason', 'idWithoutMode', '_defaultSortKey', 'userData', '_makeTestTemplates', '_descriptorLoaderPlugins', def __init__(self, file, id, type="auto", state="runnable", title=u'', purpose=u'', groups=[], modes=[], classname=DEFAULT_TESTCLASS, module=DEFAULT_MODULE, input=DEFAULT_INPUT, output=DEFAULT_OUTPUT, reference=DEFAULT_REFERENCE, traceability=[], executionOrderHint=0.0, skippedReason=None, authors=[], created=None, testDir=None, isDirConfig=False, userData=None ): self.isDirConfig = isDirConfig if not isDirConfig: assert file, [file, id] self.testDir = fromLongPathSafe(testDir or os.path.dirname(file)) self.file = file self.setId(id) if skippedReason: state = 'skipped' if state=='skipped' and not skippedReason: skippedReason = '<unknown skipped reason>' self.type = type self.state = state self.title = title self.purpose = purpose # copy groups/modes so we can safely mutate them later if desired self.groups = list(groups) if len(modes)>0 and any(not isinstance(m, TestMode) for m in modes): # simple strings were passed in; convert them modes = [(m if isinstance(m, TestMode) else TestMode(m)) for m in modes] else: modes = list(modes) if len(modes)>0 and (not any(m.isPrimary for m in modes)): modes = [TestMode(modes[0], isPrimary=True, params=modes[0].params)]+modes[1:] self.modes = modes self.authors = authors self.created = created if created and not re.match('[0-9][0-9][0-9][0-9]-[0-9][0-9]-[0-9][0-9]$', created): raise UserError('Invalid created date "%s", must be yyyy-mm-dd format, in file "%s"'%(created, file)) self.classname = classname assert classname, 'Test descriptors cannot set the classname to nothing' if not module: self.module = None elif module.endswith('.py') or module == 'PYTHONPATH': self.module = module else: self.module = module+'.py' self.input = input self.output = fromLongPathSafe(output) # just in case descriptors were loaded dynamically and contain absolute \\?\ paths on windows self.reference = reference self.traceability = traceability self.executionOrderHint = executionOrderHint self.skippedReason = skippedReason # NB: self.mode is set after construction and # cloning for each supported mode self.userData = collections.OrderedDict() if userData is None else userData
[docs] def setId(self, id): """ Change the id of this descriptor. This can be used by `DescriptorLoader` or a loader plugin to modify the id of a descriptor just after it has been parsed. Use this insteaad of assigning directly to the id field. :return: Returns ``self`` to allow fluent usage. """ self.id = id self.idWithoutMode = self.id # for internal use only (we cache this to speed up sorting based on path), # and only for tests not dir configs; # convert to lowercase to ensure a canonical sort order on case insensitive OSes; # add id to be sure they're unique (e.g. including mode) if self.file: self._defaultSortKey = self.file.lower()+'/'+self.id return self
def _getTestFile(self): # undocumented API currently # Gets the file containing the test logic - typically a .py file, but could be some other format e.g. .java (but not XML) # Usually relative to testDir, but may be an absolute path if self.file.endswith('.xml') and self.module and self.module != 'PYTHONPATH': return self.module if self.file.startswith(self.testDir): return self.file[len(self.testDir)+1:] return self.file def _createDescriptorForMode(self, mode): """ Internal API for creating a test descriptor for a specific mode of this test. :meta private: """ assert mode, 'Mode must be specified' assert not hasattr(self, 'mode'), 'Cannot create a mode descriptor from a descriptor that already has its mode set' newdescr = copy.deepcopy(self) # nb: the mode can't be deep copied accurately but of course it's not set yet so no problem! newdescr.mode = mode # we assume the passed in mode is the TestMode object (not just a str) if TestMode is what's in the descriptor newdescr.id = self.id+'~'+mode newdescr._defaultSortKey = self._defaultSortKey+'~'+mode return newdescr
[docs] def toDict(self): """Converts this descriptor to an (ordered) dict suitable for serialization.""" d = collections.OrderedDict() d['id'] = self.id d['testDir'] = self.testDir d['descriptorFile'] = self.file d['type'] = self.type d['state'] = self.state d['skippedReason'] = self.skippedReason d['title'] = self.title d['purpose'] = self.purpose d['groups'] = self.groups d['authors'] = self.authors d['created'] = self.created def modeParamsDict(m): x = m.params if m.isPrimary: x = dict(x) x['isPrimary'] = True return x d['modes'] = {str(m):modeParamsDict(m) for m in self.modes} if hasattr(self, 'mode'): d['mode'] = self.mode d['requirements'] = self.traceability # this is always a list with at least one item, or more if there are multiple modes d['executionOrderHint'] = (self.executionOrderHintsByMode if hasattr(self, 'executionOrderHintsByMode') else [self.executionOrderHint]) d['classname'] = self.classname d['module'] = self.module d['input'] = self.input d['output'] = self.output d['reference'] = self.reference d['userData'] = self.userData return d
def __str__(self): """Return an informal string representation of the xml descriptor container object :return: The string represention :rtype: string """ # Some of these are only worth printing when there's actually something to show, and for legacy things like # type/state, when a non-default value is selected s= "Test id: %s\n" % self.id reltestdir = self.testDir if not self.isDirConfig else '' # relative to current dir is most useful if reltestdir.lower().replace('\\','/').startswith(os.getcwd().lower().replace('\\','/')+'/'): reltestdir = reltestdir[len(os.getcwd())+1:] s=s+"Test directory: %s\n" % reltestdir # use OS slashes to facilitate copy+paste if self.type != 'auto': s=s+"Test type: %s\n" % self.type if self.state != 'runnable' and not self.skippedReason: s=s+"Test state: %s\n" % self.state if self.skippedReason: s=s+"Test skip reason: %s\n" % self.skippedReason s=s+"Test title: %s\n" % self.title if self.purpose: s=s+"Test purpose: " purpose = self.purpose.split('\n') for index in range(0, len(purpose)): if index == 0: s=s+"%s\n" % purpose[index] if index != 0: s=s+" %s\n" % purpose[index] if self.created or self.authors: s=s+"Test created: %s; authors: %s\n" % (self.created or '?', ', '.join(self.authors)) s=s+"Test groups: %s\n" % (u', '.join((u"'%s'"%x if u' ' in x else x) for x in self.groups) or u'<none>') def modeNameToString(m): x = "'%s'"%m if ' ' in m else m return x modeDelim = '\n --> ' if any(getattr(m, 'params', None) for m in self.modes) else ', ' longestmode = max(len(modeNameToString(m)) for m in self.modes) if self.modes else 0 def modeToString(m): x = modeNameToString(m) if modeDelim != ', ': x = ("%-"+str(longestmode+1)+"s")%x if getattr(m, 'params', None): x += '{%s}'%', '.join('%s=%r'%(k,v) for (k,v) in m.params.items()) if getattr(m, 'isPrimary', False) and len(self.modes)>1: x=x+' [PRIMARY]' return x.strip() if getattr(self, 'mode',None): # multi mode per run s=s+"Test mode: %s\n" % modeToString(self.mode) else: # print available modes instead s=s+("Test modes: %s%s\n") % (modeDelim if '\n' in modeDelim else '', modeDelim.join(modeToString(x) for x in self.modes) or u'<none>') s=s+"Test order hint: %s\n" % ( u', '.join('%s'%hint for hint in self.executionOrderHintsByMode) # for multi-mode tests if hasattr(self, 'executionOrderHintsByMode') else self.executionOrderHint) s=s+"Test classname: %s; module: %s\n" % (self.classname, self.module) if self.input not in [DEFAULT_INPUT, '.', '!Input_dir_if_present_else_testDir!', '!INPUT_DIR_IF_PRESENT_ELSE_TEST_DIR!']: s=s+"Test input: %s\n" % self.input if self.output != DEFAULT_OUTPUT: s=s+"Test output: %s\n" % self.output if self.reference != DEFAULT_REFERENCE: s=s+"Test reference: %s\n" % self.reference if self.traceability: s=s+"Test traceability: %s\n" % (u', '.join((u"'%s'"%x if u' ' in x else x) for x in self.traceability) or u'<none>') if self.userData: s=s+"Test user data: %s\n" % ', '.join('%s=%s'%(k,self.__userDataValueToString(v)) for k,v in (self.userData.items())) s=s+"" return s @staticmethod def __userDataValueToString(v): if not isstring(v): return str(v) if '\n' in v: # tab and newline character are difficult to read and in most cases whitespace will be stripped out so remove # it from this view of the strings v = '<nl>'.join(x.strip() for x in v.split('\n') if x.strip()) return repr(v).lstrip('u') def __repr__(self): return str(self)
XMLDescriptorContainer = TestDescriptor """ XMLDescriptorContainer is an alias for the TestDescriptor class, which exists for compatibility reasons only. :meta private: """
[docs]class TestModesConfigHelper: """ A helper class that is passed to the lambda which defines test modes in a pysystest configuration. It provides access to the list of inherited modes, to project properties and also helper functions for combining multiple mode lists into one and for configuring a collection of modes as primary modes. See :doc:`/pysys/UserGuide` for detailed information about what you can do with PySys modes. :ivar list[dict[str,obj]] ~.inheritedModes: A list of the inherited modes, each defined by a dictionary containing a ``mode`` key and any number of additional parameters. :ivar ~.constants: A reference to `pysys.constants` which can be used to access constants such as ``IS_WINDOWS`` for platform-dependent mode configuration. :ivar ~.pysys: A reference to the `pysys` module. :ivar callable[str] import_module: A reference to the Python ``importlib.import_module`` function that can be used if you need to access functions from additional modules such as ``sys``, ``re``, etc. :ivar pysys.config.project.Project ~.project: The project configuration, from which you can read properties. :ivar str ~.testDir: The test directory, i.e. the directory containing the ``pysystest.*`` file where this modes configuration is defined. This is not available when defining modes in ``pysysdirconfig``, but only when the mode configuration is directly in the ``pysystest.*`` file. """ def __init__(self, inheritedModes, project, testDir): self.inheritedModes = inheritedModes self.project = project self.constants = pysys.constants self.import_module = importlib.import_module self.pysys = pysys self.os = os self.testDir = testDir
[docs] def makeAllPrimary(self, modes): """ Modifies the specified list (or dict) of modes so that all of them have isPrimary=True. By default only the first mode in the mode list is "primary", so the test will only run in that one mode by default during local development (unless you supply a ``--modes`` or ``--ci`` argument). This is optimal when using modes to validate the same behaviour/conditions in different execution environments e.g. browsers/databases etc. However when using modes to validate different *behaviours/conditions* (e.g. testing out different command line options) using a single PySysTest class, then you should have all your modes as "primary" as you want all of them to execute by default in a quick local test run. You would typically combine test-specific behaviour modes with any inherited execution environment modes like this:: lambda modes: modes.createModeCombinations( helper.inheritedModes, helper.makeAllPrimary( { 'Usage': {'cmd': ['--help'], 'expectedExitStatus':'==0'}, 'BadPort': {'cmd': ['--port', '-1'], 'expectedExitStatus':'!=0'}, 'MissingPort': {'cmd': [], 'expectedExitStatus':'!=0'}, }, ) :param list[dict[str,obj]]|dict[str,dict[str,obj]] modes: A list or dict of modes to be made primary. :return: A list[dict[str,obj]] containing the modes, each with isPrimary set to true. """ if isinstance(modes, dict): modes = [{**{'mode':k}, **v} for k, v in modes.items()] for m in modes: m['isPrimary'] = True return modes
[docs] def createModeCombinations(self, *dimensions): """ Generates a mode list containing all the combinations from each mode list passed into the function. For example, you could combine a list of inherited modes (defined in parent directories' ``pysysdirconfig.xml`` files), with a second dimension containing modes for each database you want to test with and a third dimension with modes for each web browser. The result would be a single (flat) list containing modes, with names and parameter dictionaries automatically merged together from each input dimension:: lambda helper: helper.createModeCombinations( helper.inheritedModes, { 'MySQL': {'db': 'MySQL', 'dbTimeoutSecs':60}, 'SQLite': {'db': 'SQLite', 'dbTimeoutSecs':120}, 'Mock': {'db': 'Mock', 'dbTimeoutSecs':30}, }, # can use dict or list format for each mode list, whichever is more convenient: [ {'browser':'Chrome'}, # if mode is not explicitly specified it is auto-generated from the parameter(s) {'browser':'Firefox'}, ] ) would generate a list of modes named:: MySQL_Chrome MySQL_Firefox SQLite_Chrome SQLite_Firefox Mock_Chrome Mock_Firefox NB: By default the first mode in each dimension is designated a *primary* mode (one that executes by default when no ``--modes`` or ``--ci`` argument is specified), but this can be overridden by setting ``'isPrimary': True/False`` in the dict for any mode. When mode dimensions are combined, the primary modes are AND-ed together, i.e. any where *all* mode dimensions will be designated primary. So in the above case, since MySQL and Chrome are automatically set as primary modes, the MySQL_Chrome mode would be the (only) primary mode returned from this function. When using modes for different execution environments/browsers etc you probably want only the first (typically fastest/simplest/most informative) mode to be primary; on the other hand if using modes to re-use the same PySysTest logic for against various behavioural tests (different input files/args etc) you should usually set all of the modes to be primary so that all of them are executed in your test runs during local development. A common use case is to combine inherited modes from the parent pysysdirconfigs with a list of modes specific to this test:: lambda helper: helper.createModeCombinations( helper.inheritedModes, helper.makeAllPrimary( { 'Usage': {'cmd': ['--help'], 'expectedExitStatus':'==0', 'expectedMessage':None}, 'BadPort': {'cmd': ['--port', '-1'], 'expectedExitStatus':'!=0', 'expectedMessage':'Server failed: Invalid port number specified: -1'}, 'SetPortTwice': {'cmd': ['--port', '123', '--config', helper.testDir+'/myserverconfig.json'], 'expectedExitStatus':'!=0', 'expectedMessage':'Server failed: Cannot specify port twice'}, }), ) For simplicity this common case can be expressed with the more concise syntax:: __pysys_parameterized_test_modes__ = { 'Usage': {'cmd': ['--help'], 'expectedExitStatus':'==0'}, 'BadPort': {'cmd': ['--port', '-1'], 'expectedExitStatus':'!=0'}, 'MissingPort': {'cmd': [], 'expectedExitStatus':'!=0'}, } NB: For efficiency reasons, don't use the ``createModeCombinations`` method in your configuration if you are *just* using the inherited modes unchanged. :param list[dict[str,obj]]|dict[str,dict[str,obj]] dimensions: Each argument passed to this function is a list of modes, each mode defined by a dict which may contain a ``mode`` key plus any number of parameters. Alternatively, each dimension can be a dict where the mode is the key and the value is a parameters dict. :return: A list[dict[str,obj]] containing the flattened list of modes consisting of all combinations of the passed in. Mode names and parameter dictionaries will be merged. For example: ``[{"mode":"MyMode", "param1":100}, {"mode": "myMode2", "param1":200}]``. The returned list can be further manipulated using Python list comprehensions (e.g. to exclude certain combinations) if desired. .. versionadded:: 2.1 """ if len(dimensions) == 1: return dimensions[0] current = {} # key=mode name value=params for dimension in dimensions: prevModesForCombining = None if not current else current current = {} if isinstance(dimension, dict): dimension = [{**{'mode':k}, **v} for k, v in dimension.items()] for mode in dimension: modeString, params = _XMLDescriptorParser.splitModeNameAndParams(mode, project=self.project) current[modeString] = mode # end for mode # ensure at least one is primary in each dimension, else we'd lose the primary-ness when AND-ing them together if current and not any(m.get('isPrimary', False) for m in current.values()): next(iter(current.values()))['isPrimary'] = True if prevModesForCombining is not None: if not current or not prevModesForCombining: current = prevModesForCombining or current else: newModes = current current = {} for modeA, paramsA in prevModesForCombining.items(): for modeB, paramsB in newModes.items(): isPrimary = paramsA.get('isPrimary', False) and paramsB.get('isPrimary', False) params = dict(paramsA) params.update(paramsB) # newer "B" params take precedence if any keys as the same # for simplicity, just include it with params here params['isPrimary'] = isPrimary current[modeA.strip('_')+'_'+modeB.strip('_')] = params return [{**{'mode':modeString}, **params} for modeString, params in current.items()]
[docs] def combineModeDimensions(self, *dimensions): """ Old name for the `createModeCombinations` method. """ return self.createModeCombinations(*dimensions)
[docs]class TestMode(str): # subclasses string to retain compatibility for tests that don't use mode parameters """Represents a mode that a test can run in in a `TestDescriptor`, and optionally a dict of parameters that define that mode. To create one:: mode = TestMode('MyMode', {'param1': 'value1'}) See the ``mode`` parameter/field in `TestDescriptor` where this class is used. This class is immutable, so create a new instance if you want to change something. The mode values can be of any type as long as it is pickleable (see Python's `pickle` module for more information). Standard Python types like strings, dicts etc are fine. For convenience and compatibility, this TestMode subclasses a string holding the mode. :ivar str ~.name: The name of the mode as a string. :ivar dict[str,obj] ~.params: A dictionary of parameters associated with this mode. The parameters are available to the test (as ``self.mode.params``) and also assigned as instance fields on the test class when it runs in this mode. :ivar bool ~.isPrimary: Indicates whether this is a primary mode, one that executes by default even when not explicity requested with a command line option such as ``--modes=ALL``. .. versionadded:: 2.0 """ __slots__ = ['__params', '__isPrimary', '__name'] def __new__(cls,s,params=None, isPrimary=False): self = str.__new__(cls,s) self.__name = s if params is None: params = {} self.__params = params assert 'isPrimary' not in params, repr(params) self.__isPrimary = isPrimary return self @property def params(self): return self.__params @property def isPrimary(self): return self.__isPrimary @property def name(self): return self.__name def __repr__(self): return self.name+str(self.__params)+('[PRIMARY]' if self.__isPrimary else '')
class _XMLDescriptorParser(object): '''NOT PUBLIC API - use L{DescriptorLoader._parseTestDescriptor} instead. :meta private: Helper class to parse an XML test descriptor - either for a testcase, or for defaults for a (sub-)directory of testcases. If the file is/contains XML the class uses the minidom DOM (Document Object Model) non-validating parser to provide accessor methods to return element attributes and character data from the test descriptor file. The class is instantiated with the filename of the test descriptor. It is the responsibility of the user of the class to call the unlink() method of the class on completion in order to free the memory used in the parsing. If not, it uses __pysys_XXX__ dunders (Python-style but also designed to work fine in other languages whether in comments e.g. /* ... */ or even as string literals, provided there are no backslash escapes to worry about). :param bytes fileContents: Used only for testing purposes - to measure load times without any disk activity. ''' KV_PATTERN = '__pysys_%s__' __IMPORT_EXPR = b'\nimport ' if os.linesep.endswith('\n') else b'\rimport ' # the former works for windows+linux (regardless of ending), the latter for mac __PYTHON_PYSYS_DUNDER_EXPR = b'\n__pysys_' if os.linesep.endswith('\n') else b'\r__pysys_' __DISABLE_PYTHON_DESCRIPTOR_PARSING = os.getenv('PYSYS_DISABLE_PYTHON_DESCRIPTOR_PARSING','').lower()=='true' # undocumented, just for testing parseTimeXML = 0.0 parseTimePython = 0.0 def __init__(self, xmlfile, istest=True, parentDirDefaults=None, project=None, xmlRootElement=None, fileContents=None): assert project self.file = xmlfile if len(xmlfile) < 256: self.file = fromLongPathSafe(self.file)# used for error messages etc self.dirname = os.path.dirname(xmlfile) self.istest = istest self.defaults = (project._defaultDirConfig or self.DEFAULT_DESCRIPTOR) if parentDirDefaults is None else parentDirDefaults roottag = 'pysystest' if istest else 'pysysdirconfig' if not os.path.exists(xmlfile): raise UserError("Unable to find supplied descriptor \"%s\"" % self.file) self.project = project self.kvDict = {} if xmlRootElement: # used when parsing from project XML rather than directly from a standalone file self.doc = None self.root = xmlRootElement assert xmlRootElement.tagName == 'pysysdirconfig', xmlRootElement.tagName return starttime = time.monotonic() if istest and not xmlfile.endswith('.xml'): if fileContents is None: # Open in binary mode since we don't know the encoding - we'll rely on the XML header and/or Python header to tell us if it's anything unusual with open(xmlfile, 'rb') as xmlhandle: fileContents = xmlhandle.read() # Find it within a file of another type e.g. pysystest.py if xmlfile.endswith('.py') and not _XMLDescriptorParser.__DISABLE_PYTHON_DESCRIPTOR_PARSING: # NB Doing a full python parse, ignoring the import statements onwards, is up to 14% faster(!) # (for large size/complexity) than the regex approach - and of course more idiomatic for Python developers pythonHeader = fileContents # Optimize for speed (and to reduce unnecessary failures) by stripping out everything from the imports onwards # assume platform native line endings, for performance reasons - if incorrect, just means we miss the perf optimization # decent speed up from not using regex's here # we could also search for "from XXX import ..." but that's harder to match without regex's so don't bother as it would slow down the common case firstImportIndex = pythonHeader.find(_XMLDescriptorParser.__IMPORT_EXPR) # the first "\nimport " is a pretty clear sign of the imports beginning # nb: give up on optimization if there are "__pysys_" lines below the imports if firstImportIndex > 0 and _XMLDescriptorParser.__PYTHON_PYSYS_DUNDER_EXPR not in fileContents[firstImportIndex:]: pythonHeader = pythonHeader[:firstImportIndex] runpycode = compile(pythonHeader, xmlfile, 'exec') runpy_namespace = {} exec(runpycode, runpy_namespace) for k in runpy_namespace: if k.startswith('__pysys_'): if not k.endswith('__'): raise UserError(f'Incorrect key format for "{k}" (should end with "__") in "{self.file}"') self.kvDict[k[len('__pysys_'):].rstrip('_')] = runpy_namespace[k] del runpy_namespace else: # non-Python files, fall back to a general purpsoe Python-like syntax # must be at the start of a line, i.e. not after a comment # we do allow raw strings for m in re.finditer( (f'^[ \\t]*{self.KV_PATTERN.rstrip("__")%"(?P<key>[^ =]+)"} *= *(?:(?P<rawstring>[r@])?(' # r for python raw strings, @ for C# +'|'.join([ '(?P<value1>(-?[0-9+-][0-9.]+|[T]rue|[F]alse))', # number/boolean literal, would be a shame for it to have to be quoted '"""(?P<value2>(?:[^"]|"{1,2}(?!"))*)"""', '"(?P<value3>[^"]*)"', ]) +') *($|[;#\\n\\r]))?' # ensure there's no attempt to concatenate something else; we make the string matching part optional so we can give a nice error if it goes wrong ).encode('ascii'), fileContents, flags=re.DOTALL + re.MULTILINE): k = m.group('key').decode('ascii', errors='replace') if not k.endswith('__'): raise UserError(f'Incorrect key format for "{self.KV_PATTERN.rstrip("_") % k}" in "{self.file}"') k = k.rstrip('_') if k in self.kvDict: raise UserError('Duplicate key "{self.KV_PATTERN % k}__" in "{self.file}"') value = m.group('value1') or m.group('value2') or m.group('value3') if value is None: raise UserError(f'Cannot parse the value for {self.KV_PATTERN % k} in {self.file}; after the "=" you should use r"""...""", "..." or a numeric/boolean literal') if (not m.group('rawstring')) and b'\\' in value: raise UserError(f'Cannot use backslash escape sequences for {self.KV_PATTERN % k} value (unless using a raw r"""...""" string); cannot parse "{self.file}"') if k != 'xml_descriptor': # we keep xml descriptors as bytes so we can use the correct encoding value = value.decode('utf-8', errors='replace') self.kvDict[k] = value if 'title' not in self.kvDict and 'xml_descriptor' not in self.kvDict: raise UserError(f'Cannot find mandatory {self.KV_PATTERN % "title"} specifier for this test in {self.file} (found: {list(self.kvDict.keys())})') xmlcontents = self.kvDict.pop('xml_descriptor', '').strip() # not likely to be used for .py files, but might be nice for some others else: xmlcontents = fileContents # usually None, unless this is a microbenchmark performance test try: if xmlcontents: self.doc = xml.dom.minidom.parseString(xmlcontents) elif xmlcontents == None: self.doc = xml.dom.minidom.parse(xmlfile) else: self.doc = self.root = None return except Exception as ex: raise UserError("Invalid XML in descriptor '%s': %s" % (self.file, ex)) else: if self.doc.getElementsByTagName(roottag) == []: raise UserError("No <%s> element supplied in XML descriptor '%s'"%(roottag, self.file)) else: self.root = self.doc.getElementsByTagName(roottag)[0] if xmlfile.endswith('.xml'): _XMLDescriptorParser.parseTimeXML += time.monotonic()-starttime else: _XMLDescriptorParser.parseTimePython += time.monotonic()-starttime @staticmethod def parse(xmlfile, istest=True, parentDirDefaults=None, project=None, **kwargs): """ Parses the test/dir descriptor in the specified path and returns the TestDescriptor object. :param istest: True if this is a ``pysystest.*`` file, false if it is a descritor giving defaults for a directory of testcases. :param parentDirDefaults: Optional TestDescriptor instance specifying default values to be filtered in from the parent directory. """ p = _XMLDescriptorParser(xmlfile, istest=istest, parentDirDefaults=parentDirDefaults, project=project, **kwargs) try: return p.getContainer() finally: p.unlink() DEFAULT_DESCRIPTOR = TestDescriptor( file=None, id=u'', type="auto", state="runnable", title='', purpose='', groups=[], modes=[], classname=DEFAULT_TESTCLASS, module=None, input=DEFAULT_INPUT, output=DEFAULT_OUTPUT, reference=DEFAULT_REFERENCE, traceability=[], executionOrderHint=0.0, skippedReason=None, isDirConfig=True) """ A directory config descriptor instance of TestDescriptor holding the default values to be used if there is no directory config descriptor. """ def getContainer(self): '''Create and return an instance of TestDescriptor for the contents of the descriptor.''' if self.root: for attrName, attrValue in self.root.attributes.items(): if attrName not in ['state', 'type', 'authors', 'created']: raise UserError('Unknown attribute "%s" in XML descriptor "%s"'%(attrName, self.file)) cls, pymodule = self.getClassDetails() if pymodule is None and self.istest: # default setting means auto-detect (nb: NOT the same as pymodule='' which means to use the PYTHONPATH) if self.file.endswith('.py'): pymodule = os.path.basename(self.file) elif cls and '.' in cls: # if the Python class is X.Y it's probably got a package name and therefore PYTHONPATH (could be a nested class inside a run.py but pretty unlikely) pymodule = 'PYTHONPATH' else: pymodule = DEFAULT_MODULE # else run.py # some elements that are mandatory for an individual test and not used for dir config t = TestDescriptor(self.getFile(), self.getID(), self.getType(), self.getState(), self.getTitle() if self.istest else '', self.getPurpose() if self.istest else '', self.getGroups(), self.getModes(), self.project.expandProperties(cls), self.project.expandProperties(pymodule), self.project.expandProperties(self.getTestInput()), self.project.expandProperties(self.getTestOutput()), self.project.expandProperties(self.getTestReference()), self.getRequirements(), self.getExecutionOrderHint(), skippedReason=self.getSkippedReason(), testDir=self.dirname, userData={k:self.project.expandProperties(v) for k,v in self.getUserData().items()}, authors=[x.strip() for x in (self.kvDict.pop('authors', None) or (self.root.getAttribute('authors') if self.root else '') ).split(',') if x.strip()], created=self.kvDict.pop('created', None) or (self.root.getAttribute('created') if self.root else None) or None, isDirConfig=not self.istest) if self.kvDict and os.getenv('PYSYS_IGNORE_UNKNOWN_DESCRIPTOR_FIELDS','').lower()!='true': # should all have been popped during parsing raise UserError(f'Unknown {self.KV_PATTERN % "KEY"} key(s) in test descriptor "{self.file}": {", ".join(self.kvDict.keys())}') if not self.istest: # not an official/public part of the descriptor spec, so don't have it in the constructor signature t._makeTestTemplates = self._parseTestMakerTemplates() t._descriptorLoaderPlugins = getattr(self.defaults, '_descriptorLoaderPlugins', [])+self._parseDescriptorLoaderPlugins() return t def _parseDescriptorLoaderPlugins(self):# not public API, do not use plugins = [] for node in self.root.getElementsByTagName('descriptor-loader-plugin'): from pysys.config.project import _XMLProjectParser cls, optionsDict = _XMLProjectParser._parseClassAndConfigDictImpl(self.__expandPropertiesImplFromProject, node, defaultClass=None) pluginKey = (cls, tuple(optionsDict.items())) # hashable plugins.append( (pluginKey, cls, optionsDict) ) return plugins def __expandPropertiesImplFromProject(self, value, default, name=None): # hack to allow us to use _parseClassAndConfigDict from here - simulates api of _XMLProjectParser # setting default=None means we can't use <property default="...">" attributes here, but that's a price worth paying at least for now return self.project.expandProperties(value) def _parseTestMakerTemplates(self): # not public API, do not use templates = [] for e in self.root.getElementsByTagName('maker-template'): t = { 'name': e.getAttribute('name'), 'description': e.getAttribute('description'), 'copy': [x for x in (e.getAttribute('copy') or '').split(',') if x.strip()], 'mkdir': None if not e.hasAttribute('mkdir') else [self.project.expandProperties(x).strip() for x in (e.getAttribute('mkdir') or '').split(',') if self.project.expandProperties(x).strip()], 'isTest': (e.getAttribute('isTest') or '').lower() != 'false', 'replace': [], 'source': self.file, } # NB: further validation and expansion happens in console_make if not t['name']: raise UserError("A name=... attribute is required for each maker-template in \"%s\""%self.file) if not t['description']: raise UserError("A description=... attribute is required for each maker-template, in \"%s\""%self.file) for r in e.getElementsByTagName('replace'): r1, r2 = r.getAttribute('regex'), r.getAttribute('with') if not r1 or not r2: raise UserError("Each maker-template <replace> element requires both a regex= and a with= attribute, in \"%s\""%self.file) t['replace'].append( (r1, r2) ) templates.append(t) for e in self.root.getElementsByTagName('set-default-maker-template'): # for ease of processing, set the name to a fixed sentinel value so that the normal template handling logic can apply and the latest one will always override it templates.append({'name':'set-default-maker-template', 'set-default-maker-template': e.getAttribute('name')}) # NB: we don't combine with defaults here, that happens in the make launcher return templates def unlink(self): '''Clean up the DOM on completion.''' if self.doc: self.doc.unlink() def getFile(self): '''Return the filename of the test descriptor.''' return self.file def getID(self): '''Return the id of the test, or for a pysysdirconfig, the id prefix.''' id = self.defaults.id + self.kvDict.pop('id-prefix','')+self.getElementTextOrDefault('id-prefix', default='') for c in u'\\/:~#<>': # reserve a few characters that we might need for other purposes; _ and . can be used however if c in id: raise UserError('The <id-prefix> is not permitted to contain "%s"; error in "%s"'%(c, self.file)) if self.istest: id = id+os.path.basename(self.dirname) return id def getType(self): '''Return the type attribute of the test element - mostly just legacy now.''' if not self.root: return self.defaults.type type = self.root.getAttribute("type") or self.defaults.type if type not in ["auto", "manual"]: raise UserError("The type attribute of the test element should be \"auto\" or \"manual\" in \"%s\""%self.file) return type def getState(self): '''Return the state attribute of the test element - mostly just legacy now.''' if not self.root: return self.defaults.state state = self.root.getAttribute("state") or self.defaults.state if state not in ["runnable", "deprecated", "skipped"]: raise UserError("The state attribute of the test element should be \"runnable\", \"deprecated\" or \"skipped\" in \"%s\""%self.file) return state def getSkippedReason(self): r = self.kvDict.pop('skipped_reason', None) if r is not None: if not r: raise UserError('Missing value for skipped reason in "{self.file}"') return r if self.root: for e in self.root.getElementsByTagName('skipped'): r = (e.getAttribute('reason') or '').strip() # make this mandatory, to encourage good practice if not r: raise UserError('Missing reason= attribute in <skipped> element of "{self.file}"') return r return self.defaults.skippedReason def getTitle(self): # PySys 1.6.1 gave an error if <description> was missing, but a default if <title> was missing, and permitted empty string. So don't be too picky. result = self.kvDict.pop('title', None) or self.getElementTextOrDefault('title', optionalParents=['description']) if result is None and self.istest: result = self.getID() # falling back to the ID is better than nothing result = result.replace('\n',' ').replace('\r',' ').replace('\t', ' ').strip().rstrip('.') if ' ' in result: result = re.sub(' +', ' ', result) if len(result)==0 and self.istest: result = self.getID() # falling back to the ID is better than nothing return result def getPurpose(self): result = self.kvDict.pop('purpose', None) or self.getElementTextOrDefault('purpose', optionalParents=['description']) if result is None: result = self.defaults.purpose if not result: return result return inspect.cleandoc(result.replace('\r','').replace('\t', ' ')).strip() def getGroups(self): groupList = [] groups = self.kvDict.pop('groups', None) if isinstance(groups, str): groups = groups.replace(' ','').split(';') groupList = [g for g in groups[0].split(',') if g] if len(groups) > 1 and groups[1].lower() not in ['inherit=true', 'inherit=false']: raise UserError(f'Invalid inherit= specifier - groups should be in the form "my-group1, mygroup2, ...; inherit=true/false" in descriptor "{self.file}"') if len(groups)>1 and groups[1].lower() == 'inherit=false': return groupList else: groups = self.getSingleElement('groups', optionalParents=['classification']) if groups: if groups.parentNode.tagName not in ['pysystest', 'pysysdirconfig', 'classification']: raise UserError("<groups> element found under <%s> but must be under the root node (or the <classification> node), in XML descriptor \"%s\""%(groups.parentNode.tagName, self.file)) if groups.getAttribute('groups'): groupList.extend(g.strip() for g in groups.getAttribute('groups').split(',') if g.strip()) for node in groups.getElementsByTagName('group'): g = self.getText(node) if g and g.strip(): groupList.append(g.strip()) if (groups.getAttribute('inherit') or 'true').lower()!='true': return groupList # don't inherit groupList = [x for x in self.defaults.groups if x not in groupList]+groupList return groupList @staticmethod def splitModeNameAndParams(mode, project): """ Returns (modename, params). Auto-generates a mode name if one is not already provided. WARNING: The mode dict is mutated by this method. """ if isinstance(mode, TestMode): # just for the parameterized test modes use case modeString = mode.name params = dict(mode.params) params['isPrimary'] = mode.isPrimary mode = params else: assert isinstance(mode, dict), 'Each mode must be a {...} dict but found unexpected object %r (%s)'%(mode, mode.__class__.__name__) modeString = mode.pop('mode', None) if modeString: return modeString, mode # Auto-generate mode string assert len(mode) != 0, 'Must provide a name and/or params for every mode dictionary' modeString = '_'.join( '%s=%s'%(k, v) if (not isinstance(v, str) or re.match('^([-0-9.]+|true|false|)$', v, flags=re.IGNORECASE)) else v # include the key for numeric and boolean values for (k,v) in mode.items() if k != 'isPrimary') modeString = modeString.strip('_') # avoid leading/trailing _'s # Enforce consistent naming convention of initial caps if project.getProperty('enforceModeCapitalization', True): modeString = modeString[0].upper()+modeString[1:] assert modeString, 'Mode name cannot be empty' return modeString, mode def _addParameterizedTestModes(self, base): # base: list(TestMode) parameterized = self.kvDict.pop('parameterized_test_modes', None) if not parameterized: return base assert isinstance(parameterized, list) or isinstance(parameterized, dict), 'Parameterized test modes must be a list or dict of modes, but got: %r'%parameterized helper = TestModesConfigHelper( inheritedModes=[], project=self.project, testDir=os.path.dirname(self.file) if self.istest else None ) return [TestMode(m.pop('mode'), isPrimary=m.pop('isPrimary', False), params=m) for m in helper.createModeCombinations( base, helper.makeAllPrimary(parameterized))] def getModes(self): text = self.kvDict.pop('modes', None) modesNode = None if text is None or text=='': # nb: do NOT handle [] the same as empty string since that's a common pitfall modesNode = self.getSingleElement('modes', optionalParents=['classification']) if modesNode: text = self.getText(modesNode) else: # if we have neither kvText text nor mode return self._addParameterizedTestModes(self.defaults.modes) # by default we inherit if text is None or text=='': # pre-2.0 XML approach result = {} for node in modesNode.getElementsByTagName('mode'): modeString = node.getAttribute('mode') or self.getText(node) if modeString: result[modeString] = {} if (modesNode.getAttribute('inherit') or 'true').lower() == 'true': # This logic is intended to preserve primary inherited modes; it's a bit weird, but keeping it the same for compatibility inherited = [x for x in self.defaults.modes if x not in result] else: inherited = [] result = inherited+[TestMode(k, params=v) for (k,v) in result.items()] if result and not any(m.isPrimary for m in result): result[0] = TestMode(result[0], params=result[0].params, isPrimary=True) return self._addParameterizedTestModes(result) # The modern PySys 2.0+ approach with a Python eval string try: modesLambda = text if isinstance(modesLambda, str): # kvDict may contain non-string values direct from Python # use an empty namespace since if we were parsing this as real python, all import statements would be appearing later modesLambda = pysys.utils.safeeval.safeEval(text.strip(), extraNamespace={}, emptyNamespace=True) assert callable(modesLambda), 'Expecting callable (e.g. lambda helper: [...]) but got %r'%modesLambda helper = TestModesConfigHelper( # note that inheritedModes param dicts may be mutated (so good thing we'd creating a new dict here for the default modes) inheritedModes=[{**mode.params, **{'mode':mode, 'isPrimary':mode.isPrimary}} for mode in self.defaults.modes], project=self.project, testDir=os.path.dirname(self.file) if self.istest else None ) modes = modesLambda(helper) # assumes it's a callable accepting a single parameter if isinstance(modes, dict): modes = [{**{'mode':k}, **v} for k, v in modes.items()] assert isinstance(modes, list), 'Expecting a list of modes, got a %s: %r'%(modes.__class__.__name__, modes) assert not modesNode or not modesNode.hasAttribute('inherit'), 'Cannot use the legacy inherit= attribute when using the modern Python lambda to define modes' # Add parameterized modes before validation modes = self._addParameterizedTestModes(modes) result = [] already = set() expectedparams = None for m in modes: modeString, params = self.splitModeNameAndParams(m, project=self.project) isPrimary = params.pop('isPrimary', False) assert isPrimary in [True, False], 'isPrimary must be set to True or False, not %r'%isPrimary # Eliminate dodgy characters badchars = re.sub('[%s]+'%pysys.launcher.MODE_CHARS,'', modeString) if badchars: log.debug('Unsupported characters "%s" found in test mode "%s" of %s; stripping them out', ''.join(set(c for c in badchars)), modeString, self.file) modeString = re.sub('[^%s]'%pysys.launcher.MODE_CHARS,'', modeString) modeString = modeString.strip().strip('_') # avoid leading/trailing _'s and whitespace, since we'll add them when composing modes assert modeString, 'Invalid mode: cannot be empty' assert '__' not in modeString, 'Invalid mode "%s" cannot contain double underscore'%modeString # Enforce consistent naming convention of initial caps if self.project.getProperty('enforceModeCapitalization', True): modeString = modeString[0].upper()+modeString[1:] assert modeString not in already, 'Duplicate mode "%s"'%modeString already.add(modeString) for p in params: assert not p.startswith('_'), 'Illegal mode parameter name - cannot start with underscore: %s'%p # check that params are the same in each one to avoid mistakes if expectedparams is None: expectedparams = sorted(params.keys()) assert sorted(params.keys()) == expectedparams, f'The same mode parameter keys must be given for every mode in the list, but found {sorted(params.keys())} parameters for "{modeString}" different to {expectedparams}' result.append(TestMode(modeString, isPrimary=isPrimary, params=params)) result = self._addParameterizedTestModes(result) # ensure there's at least one primary mode if result and not any(m.isPrimary for m in result): result[0] = TestMode(result[0], params=result[0].params, isPrimary=True) return result except Exception as ex: log.debug('Invalid modes config: ', exc_info=True) raise UserError("Invalid modes configuration in %s: %s"%(self.file, ex)) def getClassDetails(self): '''Return the Python test class attributes (name, module, searchpath), contained in the class element.''' classname, module = self.kvDict.pop('python_class', None), self.kvDict.pop('python_module', None) el = self.getSingleElement('class', optionalParents=['data']) if el: classname = classname or el.getAttribute('name') module = module or el.getAttribute('module') # nb: empty means look it up in PYTHONPATH, None is a sentinel value meaning auto, based on descriptor extension if module == '': module = 'PYTHONPATH' # probably this is what was intended return [classname or self.defaults.classname, module or self.defaults.module] def getExecutionOrderHint(self): r = self.kvDict.pop('execution_order_hint', None) if r is None: e = self.getSingleElement('execution-order') r = None if e: r = e.getAttribute('hint') if r: try: r = float(r) except Exception: raise UserError('Invalid float value specified for execution order hint in "%s"'%self.file) if r is None or r == '': return self.defaults.executionOrderHint else: return r def getUserData(self): newitems = self.kvDict.pop('user_data', {}) if isinstance(newitems, str): newitems = pysys.utils.safeeval.safeEval(newitems.strip(), extraNamespace={}, emptyNamespace=True) for k in [k for k in self.kvDict if k.startswith('user_data_')]: newitems[k[k.find('data_')+5:]] = self.kvDict.pop(k) for k in [k for k in self.kvDict if k.startswith('user_data.')]: # TODO??? newitems[k[k.find('.')+1:]] = self.kvDict.pop(k) if not newitems: data = self.getSingleElement('data') if data: for e in data.getElementsByTagName('user-data'): key = e.getAttribute('name').strip() # NB: we don't use inspect.cleandoc here since it'd probably slow down descriptor loading and in 99% # of for multi-line strings we will be stripping whitespace anyway so not a good use of time value = e.getAttribute('value') if not value and e.childNodes: value = '\n'.join(n.data for n in e.childNodes if (n.nodeType in {n.TEXT_NODE,n.CDATA_SECTION_NODE}) and n.data) if value is None: value = '' newitems[key] = value for key in newitems: assert key, 'name must be specified for user data' assert key not in {'input', 'output', 'reference', 'descriptor', 'runner', 'log', 'project', 'lock'}, key # prevent names that we reserve for use by the basetest/processuser # start with parent defaults, add children result = dict(self.defaults.userData) result.update(newitems) return result def getTestInput(self): value = self.kvDict.pop('input_dir', None) if value: return value node = self.getSingleElement('input', optionalParents=['data']) or self.getSingleElement('input-dir', optionalParents=['data']) if node: x = node.getAttribute('path') or self.getText(node) if x: return x return self.defaults.input def getTestOutput(self): value = self.kvDict.pop('output_dir', None) if value: return value node = self.getSingleElement('output', optionalParents=['data']) or self.getSingleElement('output-dir', optionalParents=['data']) if node: x = node.getAttribute('path') or self.getText(node) if x: return x return self.defaults.output def getTestReference(self): value = self.kvDict.pop('reference_dir', None) if value: return value node = self.getSingleElement('reference', optionalParents=['data']) or self.getSingleElement('reference-dir', optionalParents=['data']) if node: x = node.getAttribute('path') or self.getText(node) if x: return x return self.defaults.reference def getRequirements(self): '''Return a list of the requirement ids, contained in the character data of the requirement elements.''' reqList = [x.strip() for x in self.kvDict.pop('traceability_ids', '').split(',') if x.strip()] if self.root: for node in self.root.getElementsByTagName('requirement'): if (node.getAttribute('id') or '').strip(): reqList.append(node.getAttribute('id').strip()) # these used to always be below <traceability><requirements>..., but now we allow them directly under the root node # (or anywhere the user wants) reqList = [x for x in self.defaults.traceability if x not in reqList]+reqList return reqList @staticmethod def getText(element): """Utility method that reads text from the specified element and strips leading/trailing whitespace from it. Returns an empty string if none. """ t = u'' if not element: return t for n in element.childNodes: if (n.nodeType in [element.TEXT_NODE, element.CDATA_SECTION_NODE]) and n.data: t += n.data return t.strip() def getSingleElement(self, tagName, parent=None, optionalParents=[]): """Utility method that finds a single child element of the specified name and strips leading/trailing whitespace from it. Returns None if not found. """ if not self.root: return None t = u'' if not parent: parent = self.root nodes = parent.getElementsByTagName(tagName) if len(nodes) == 0: return None if len(nodes) > 1: raise UserError('Expected one element <%s> but found more than one in %s' % (tagName, self.file)) if nodes[0].parentNode.tagName not in ['pysystest', 'pysysdirconfig']+optionalParents: sys.stderr.write("WARNING: XML descriptor element <%s> is not permitted under <%s> of \"%s\"\n"%(tagName, nodes[0].parentNode.tagName, self.file)) sys.stderr.flush() return nodes[0] def getElementTextOrDefault(self, tagName, default=None, parent=None, optionalParents=[]): """Utility method that finds a single child element of the specified name and strips leading/trailing whitespace from it. Returns an empty string if none. """ t = u'' node = self.getSingleElement(tagName, parent=parent, optionalParents=optionalParents) if node is None: return default return self.getText(node) IGNORED_PYSYSTEST_SUFFIXES = tuple( (os.getenv('PYSYS_IGNORED_PYSYSTEST_SUFFIXES', '')+',~,.tmp,.bak,.swp,.orig').strip(',').replace(' ','').split(',') ) """ A tuple listing ``pysystest.*`` suffixes that will be ignored due to being temporary/backup/swap files for common editors and IDEs. The list can be extended by setting the ``PYSYS_IGNORED_PYSYSTEST_SUFFIXES`` environment variable to a comma-separated list of additional extensions. """
[docs]class DescriptorLoader(object): """ This class is responsible for locating and loading all available testcase descriptors. A custom DescriptorLoader subclass can be provided to customize the test discovery process, typically by overriding L{loadDescriptors} and modifying the returned list of descriptors and configuring your ``pysysproject.xml`` with:: <descriptor-loader module="mypkg.custom" classname="CustomDescriptorLoader"/> You could use this approach to add additional descriptor instances to represent non-PySys testcases found under the search directory, for example based on discovery of unit test classes. Another key use case would be dynamically adding or changing descriptor settings such as the list of modes for each testcase or the executionOrderHint, perhaps based on a per-group basis. For example, you could modify descriptors in the "database-tests" group to have a dynamically generated list of modes identifying the possible database servers supported without having to hardcode that list into any descriptor files on disk, and allowing for different database modes on different platforms. This class may use multi-threading to improve performance, so any extensions must be thread-safe. :ivar pysys.config.project.Project ~.project: The `pysys.config.project.Project` instance. """ def __init__(self, project, **kwargs): assert project, 'project must be specified' self.project = project # Import these since they _could_ be needed when parsing pysystest.py descriptors import pysys.baserunner import pysys.basetest self.__descriptorPluginCache = {}
[docs] def loadDescriptors(self, dir, **kwargs): """Find all descriptors located under the specified directory (including its children), and return them as a list. Subclasses may change the returned descriptors and/or add additional instances of their own to the list after calling the super implementation:: descriptors = super().loadDescriptors(dir, **kwargs) ... return descriptors :param dir: The parent directory to search for runnable tests. :return: List of L{pysys.config.descriptor.TestDescriptor} objects which could be selected for execution. If a test can be run in multiple modes there must be a single descriptor for it in the list returned from this method. Each multi-mode descriptor is later expanded out into separate mode-specific descriptors (at the same time as descriptor filtering based on command line arguments, and addition of project-level execution-order), before the final list is sorted and passed to L{pysys.baserunner.BaseRunner}. The order of the returned list is random, so the caller is responsible for sorting this list to ensure deterministic behaviour. :rtype: list :raises UserError: Raised if no testcases can be found. """ assert not kwargs, 'reserved for future use: %s'%kwargs.keys() assert self.project, 'project must be specified' assert dir, 'dir must be specified' assert os.path.isabs(dir), 'dir must be an absolute path: %s'%dir project = self.project descriptors = [] ignoreSet = set(OSWALK_IGNORES+[DEFAULT_INPUT, DEFAULT_OUTPUT, DEFAULT_REFERENCE, "_pysys_templates"]) if project.properties.get('pysysTestDescriptorFileNames') or DEFAULT_DESCRIPTOR != ['pysystest.xml']: # compatibility mode descriptorSet = set([s.strip() for s in project.getProperty('pysysTestDescriptorFileNames', default=','.join(DEFAULT_DESCRIPTOR)).split(',')]) else: descriptorSet = None assert project.projectFile != None log = logging.getLogger('pysys.launcher') # although it's highly unlikely, if any test paths did slip outside the Windows 256 char limit, # it would be very dangerous to skip them (which is what os.walk does unless passed a \\?\ path), # so must use long-path-safe dir = toLongPathSafe(os.path.normpath(dir)) assert os.path.exists(dir), dir # sanity check if project.projectFile: projectroot = toLongPathSafe(os.path.normpath(os.path.dirname(project.projectFile))) def fastdirname(path): # This is much faster than os.path.dirname # The "or" is to account for minor difference fastdirname('/foo')='' whereas os.path.dirname='/' return path[:path.rfind(os.sep)] or '/' DIR_CONFIG_DESCRIPTOR = 'pysysdirconfig.xml' if not project.projectFile or not dir.startswith(projectroot): dirconfigs = None log.debug('Project file does not exist under "%s" so processing of %s files is disabled', dir, DIR_CONFIG_DESCRIPTOR) else: # find directory config descriptors between the project root and the testcase # dirs. We deliberately use project dir not current working dir since # we don't want descriptors to be loaded differently depending on where the # tests are run from (i.e. should be independent of cwd). # see also console_make.py which needs similar logic dirconfigs = {} # load any descriptors between the project dir up to (but not including) the dir we'll be walking searchdirsuffix = dir[len(projectroot)+1:].split(os.sep) if len(dir)>len(projectroot) else [] currentconfig = project._defaultDirConfig or _XMLDescriptorParser.DEFAULT_DESCRIPTOR for i in range(len(searchdirsuffix)): # up to but not including dir if i == 0: currentdir = projectroot else: currentdir = projectroot+os.sep+os.sep.join(searchdirsuffix[:i]) if pathexists(currentdir+os.sep+DIR_CONFIG_DESCRIPTOR): currentconfig = self._parseTestDescriptor(currentdir+os.sep+DIR_CONFIG_DESCRIPTOR, parentDirDefaults=currentconfig, isDirConfig=True) log.debug('Loaded directory configuration descriptor from %s: \n%s', currentdir, currentconfig) # this is the top-level directory that will be checked below dirconfigs[fastdirname(dir)] = currentconfig descriptorsToParse = [] # NB: if changing this logic be sure to test the special case dir='/foo' def visitDir(root): with os.scandir(root) as it: dirs = [] files = [] for entry in it: if entry.is_dir(): if entry.name in ignoreSet: continue dirs.append(entry.name) continue fname = entry.name if fname in ['.pysysignore', 'pysysignore']: log.debug('Skipping directory due to ignore file %s', entry.path) return files.append(fname) if dirconfigs is not None: parentconfig = dirconfigs[fastdirname(root)] assert parentconfig if next( (f for f in files if (f == DIR_CONFIG_DESCRIPTOR)), None): parentconfig = self._parseTestDescriptor(root+os.sep+DIR_CONFIG_DESCRIPTOR, parentDirDefaults=parentconfig, isDirConfig=True) log.debug('Loaded directory configuration descriptor from %s: \n%s', root, parentconfig) else: parentconfig = project._defaultDirConfig or _XMLDescriptorParser.DEFAULT_DESCRIPTOR # allow subclasses to modify descriptors list and/or avoid processing # subdirectories if self._handleSubDirectory(root, dirs, files, descriptors, parentDirDefaults=parentconfig): return if descriptorSet is None: intersection = [f for f in files if f.lower().startswith('pysystest.') and not f.endswith(IGNORED_PYSYSTEST_SUFFIXES)] else: # compatibility mode intersection = descriptorSet & set(files) if intersection: if len(intersection) > 1: raise Exception('Only one test should be present per directory but found %s in %s'%(intersection, root)) descriptorfile = fromLongPathSafe(root+os.sep+intersection.pop()) descriptorsToParse.append((descriptorfile, parentconfig)) # if this is a test dir, it never makes sense to look at sub directories return if dirconfigs is not None and len(dirs)>0: # stash it for when we navigate down to subdirectories # only add to dict if we're continuing to process children dirconfigs[root] = parentconfig for d in dirs: visitDir(root+os.sep+d) # end of visitDir() definition visitDir(dir) # Tried using multithreading with Python 3.9.5 but limited benefit approx 10%, probably due to GIL descriptors.extend(p for p in map(lambda element: self._parseTestDescriptor(descriptorfile=element[0], parentDirDefaults=element[1]), descriptorsToParse) if p) return descriptors
[docs] def _handleSubDirectory(self, dir, subdirs, files, descriptors, parentDirDefaults, **kwargs): """Overrides the handling of each sub-directory found while walking the directory tree during `loadDescriptors`. Can be used to add test descriptors, and/or add custom logic for preventing PySys searching a particular part of the directory tree perhaps based on the presence of specific files or subdirectories within it. This method is called before directories containing pysysignore files are stripped out. :param str dir: The full path of the directory to be processed. On Windows, this will be a long-path safe unicode string. :param list[str] subdirs: a list of the subdirectories under dir, which can be used to detect what kind of directory this is, and also can be modified by this method to prevent other loaders looking at subdirectories. :param list[str] files: a list of the files under dir, which can be used to detect what kind of directory this is, and also can be modified by this method to prevent other loaders looking at them. :param list[TestDescriptor] descriptors: A list of `TestDescriptor` items which this method can add to if desired. :param TestDescriptor parentDirDefaults: A `TestDescriptor` containing defaults from the parent directory, or None if there are none. Test loaders may optionally merge some of this information with test-specific information when creating test descriptors. :param dict kwargs: Reserved for future use. Pass this to the base class implementation when calling it. :return: If True, this part of the directory tree has been fully handled and PySys will not search under it any more. False to allow normal PySys handling of the directory to proceed. """ assert not kwargs, 'reserved for future use: %s'%kwargs.keys() # default implementation just delegates to any plugins for (key, pluginCls, pluginProperties) in getattr(parentDirDefaults, '_descriptorLoaderPlugins', []): plugin = self.__descriptorPluginCache.get(key, None) if plugin is None: plugin = pluginCls() plugin.project = self.project plugin.descriptorLoader = self pysys.utils.misc.setInstanceVariablesFromDict(plugin, pluginProperties, errorOnMissingVariables=True) plugin.setup(project=self.project) self.__descriptorPluginCache[key] = plugin if plugin.addDescriptorsFromDirectory(dir=dir, subdirs=subdirs, files=files, parentDirDefaults=parentDirDefaults, descriptors=descriptors, **kwargs): return True return False
[docs] def _parseTestDescriptor(self, descriptorfile, parentDirDefaults=None, isDirConfig=False, **kwargs): """ Parses a single descriptor file (typically an XML file, or a file of another type containing XML) for a testcase or directory configuration and returns the resulting descriptor. :param descriptorfile: The absolute path of the descriptor file. :param parentDirDefaults: A L{TestDescriptor} instance containing defaults to inherit from the parent directory, or None if none was found. :param isDirConfig: False for normal test descriptors, True for a directory configuration. :return: The L{TestDescriptor} instance, or None if none should be added for this descriptor file. Note that subclasses may modify the contents of the returned instance. :raises UserError: If the descriptor is invalid and an error should be displayed to the user without any Python stacktrace. The exception message must contain the path of the descriptorfile. """ assert len(kwargs)==0 or list(kwargs.keys())==['fileContents'], 'reserved for future use: %s'%kwargs.keys() try: return _XMLDescriptorParser.parse(descriptorfile, parentDirDefaults=parentDirDefaults, istest=not isDirConfig, project=self.project, **kwargs) except UserError: raise # no stack trace needed, will already include descriptorfile name except Exception as e: log.info('Failed to read descriptor %s: ', descriptorfile, exc_info=True) raise Exception("Error reading descriptor from '%s': %s - %s" % (descriptorfile, e.__class__.__name__, e)) from e