LSSTApplications  11.0-13-gbb96280,12.1.rc1,12.1.rc1+1,12.1.rc1+2,12.1.rc1+5,12.1.rc1+8,12.1.rc1-1-g06d7636+1,12.1.rc1-1-g253890b+5,12.1.rc1-1-g3d31b68+7,12.1.rc1-1-g3db6b75+1,12.1.rc1-1-g5c1385a+3,12.1.rc1-1-g83b2247,12.1.rc1-1-g90cb4cf+6,12.1.rc1-1-g91da24b+3,12.1.rc1-2-g3521f8a,12.1.rc1-2-g39433dd+4,12.1.rc1-2-g486411b+2,12.1.rc1-2-g4c2be76,12.1.rc1-2-gc9c0491,12.1.rc1-2-gda2cd4f+6,12.1.rc1-3-g3391c73+2,12.1.rc1-3-g8c1bd6c+1,12.1.rc1-3-gcf4b6cb+2,12.1.rc1-4-g057223e+1,12.1.rc1-4-g19ed13b+2,12.1.rc1-4-g30492a7
LSSTDataManagementBasePackage
argumentParser.py
Go to the documentation of this file.
1 #
2 # LSST Data Management System
3 # Copyright 2008-2015 AURA/LSST.
4 #
5 # This product includes software developed by the
6 # LSST Project (http://www.lsst.org/).
7 #
8 # This program is free software: you can redistribute it and/or modify
9 # it under the terms of the GNU General Public License as published by
10 # the Free Software Foundation, either version 3 of the License, or
11 # (at your option) any later version.
12 #
13 # This program is distributed in the hope that it will be useful,
14 # but WITHOUT ANY WARRANTY; without even the implied warranty of
15 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 # GNU General Public License for more details.
17 #
18 # You should have received a copy of the LSST License Statement and
19 # the GNU General Public License along with this program. If not,
20 # see <https://www.lsstcorp.org/LegalNotices/>.
21 #
22 from __future__ import absolute_import, division, print_function
23 import abc
24 import argparse
25 import collections
26 import fnmatch
27 import itertools
28 import os
29 import re
30 import shlex
31 import sys
32 import shutil
33 import textwrap
34 
35 from builtins import zip
36 from builtins import str
37 from builtins import range
38 from builtins import object
39 
40 
41 import lsst.utils
42 import lsst.pex.config as pexConfig
43 import lsst.log as lsstLog
44 import lsst.daf.persistence as dafPersist
45 from future.utils import with_metaclass
46 
47 __all__ = ["ArgumentParser", "ConfigFileAction", "ConfigValueAction", "DataIdContainer",
48  "DatasetArgument", "ConfigDatasetType", "InputOnlyArgumentParser"]
49 
50 DEFAULT_INPUT_NAME = "PIPE_INPUT_ROOT"
51 DEFAULT_CALIB_NAME = "PIPE_CALIB_ROOT"
52 DEFAULT_OUTPUT_NAME = "PIPE_OUTPUT_ROOT"
53 
54 
55 def _fixPath(defName, path):
56  """!Apply environment variable as default root, if present, and abspath
57 
58  @param[in] defName name of environment variable containing default root path;
59  if the environment variable does not exist then the path is relative
60  to the current working directory
61  @param[in] path path relative to default root path
62  @return abspath: path that has been expanded, or None if the environment variable does not exist
63  and path is None
64  """
65  defRoot = os.environ.get(defName)
66  if defRoot is None:
67  if path is None:
68  return None
69  return os.path.abspath(path)
70  return os.path.abspath(os.path.join(defRoot, path or ""))
71 
72 
class DataIdContainer(object):
    """!A container for data IDs and associated data references

    Override for data IDs that require special handling to be converted to data references,
    and specify the override class as ContainerClass for add_id_argument.
    (If you don't want the argument parser to compute data references, you may use this class
    and specify doMakeDataRefList=False in add_id_argument.)
    """

    def __init__(self, level=None):
        """!Construct a DataIdContainer"""
        # actual dataset type, as specified on the command line (if dynamic)
        self.datasetType = None
        self.level = level
        self.idList = []
        self.refList = []

    def setDatasetType(self, datasetType):
        """!Set actual dataset type, once it is known"""
        self.datasetType = datasetType

    def castDataIds(self, butler):
        """!Validate data IDs and cast them to the correct type (modify idList in place).

        @param[in] butler data butler (a \\ref lsst.daf.persistence.butler.Butler
            "lsst.daf.persistence.Butler")
        """
        if self.datasetType is None:
            raise RuntimeError("Must call setDatasetType first")
        try:
            keyTypes = butler.getKeys(datasetType=self.datasetType, level=self.level)
        except KeyError:
            raise KeyError("Cannot get keys for datasetType %s at level %s" % (self.datasetType, self.level))

        for dataId in self.idList:
            for key, strVal in dataId.items():
                if key not in keyTypes:
                    validKeys = sorted(keyTypes.keys())
                    raise KeyError("Unrecognized ID key %r; valid keys are: %s" % (key, validKeys))
                keyType = keyTypes[key]
                # values arrive as strings from the command line; only non-str keys need casting
                if keyType == str:
                    continue
                try:
                    dataId[key] = keyType(strVal)
                except Exception:
                    raise TypeError("Cannot cast value %r to %s for ID key %r" % (strVal, keyType, key,))

    def makeDataRefList(self, namespace):
        """!Compute refList based on idList

        Not called if add_id_argument called with doMakeDataRefList=False

        @param[in] namespace results of parsing command-line (with 'butler' and 'log' elements)
        """
        if self.datasetType is None:
            raise RuntimeError("Must call setDatasetType first")
        butler = namespace.butler
        for dataId in self.idList:
            subset = butler.subset(datasetType=self.datasetType, level=self.level, dataId=dataId)
            # exclude nonexistent data; this is a recursive test, e.g. for the sake of "raw" data
            existing = [ref for ref in subset
                        if dataExists(butler=butler, datasetType=self.datasetType, dataRef=ref)]
            if not existing:
                namespace.log.warn("No data found for dataId=%s" % (dataId,))
                continue
            self.refList += existing
140 
141 
class DataIdArgument(object):
    """!Glorified struct for data about id arguments, used by ArgumentParser.add_id_argument"""

    def __init__(self, name, datasetType, level, doMakeDataRefList=True, ContainerClass=DataIdContainer):
        """!Constructor

        @param[in] name name of identifier (argument name without dashes)
        @param[in] datasetType type of dataset; specify a string for a fixed dataset type
            or a DatasetArgument for a dynamic dataset type (e.g. one specified by a command-line argument)
        @param[in] level level of dataset, for butler
        @param[in] doMakeDataRefList construct data references?
        @param[in] ContainerClass class to contain data IDs and data references;
            the default class will work for many kinds of data, but you may have to override
            to compute some kinds of data references.
        """
        if name.startswith("-"):
            raise RuntimeError("Name %s must not start with -" % (name,))
        self.name = name
        self.datasetType = datasetType
        self.level = level
        self.doMakeDataRefList = bool(doMakeDataRefList)
        self.ContainerClass = ContainerClass
        self.argName = name.lstrip("-")

    @property
    def isDynamicDatasetType(self):
        """!Is the dataset type dynamic (specified on the command line)?"""
        return isinstance(self.datasetType, DynamicDatasetType)

    def getDatasetType(self, namespace):
        """!Return the dataset type as a string

        @param[in] namespace parsed command
        """
        if self.isDynamicDatasetType:
            return self.datasetType.getDatasetType(namespace)
        else:
            return self.datasetType
180 
181 
class DynamicDatasetType(with_metaclass(abc.ABCMeta, object)):
    """!Abstract base class for a dataset type determined from parsed command-line arguments
    """

    def addArgument(self, parser, idName):
        """!Add a command-line argument to specify dataset type name, if wanted

        @param[in] parser argument parser to which to add argument
        @param[in] idName name of data ID argument, without the leading "--", e.g. "id"

        This default implementation is a no-op; subclasses that need an extra
        command-line argument override it.
        """
        pass

    @abc.abstractmethod
    def getDatasetType(self, namespace):
        """Return the dataset type as a string, based on parsed command-line arguments

        @param[in] namespace parsed command
        """
        raise NotImplementedError("Subclasses must override")
203 
204 
class DatasetArgument(DynamicDatasetType):
    """!A dataset type specified by a command-line argument.
    """

    def __init__(self,
                 name=None,
                 help="dataset type to process from input data repository",
                 default=None,
                 ):
        """!Construct a DatasetArgument

        @param[in] name name of command-line argument (including leading "--", if appropriate)
            whose value is the dataset type; if None, uses --idName_dstype
            where idName is the name of the data ID argument (e.g. "id")
        @param[in] help help string for the command-line argument
        @param[in] default default value; if None, then the command-line option is required;
            ignored if the argument is positional (name does not start with "-")
            because positional arguments do not support default values
        """
        DynamicDatasetType.__init__(self)
        self.name = name
        self.help = help
        self.default = default

    def getDatasetType(self, namespace):
        """Return the dataset type as a string, from the appropriate command-line argument

        @param[in] namespace parsed command
        """
        argName = self.name.lstrip("-")
        return getattr(namespace, argName)

    def addArgument(self, parser, idName):
        """!Add a command-line argument to specify dataset type name

        Also set self.name if it is None
        """
        help = self.help if self.help else "dataset type for %s" % (idName,)
        if self.name is None:
            self.name = "--%s_dstype" % (idName,)
        requiredDict = dict()
        if self.name.startswith("-"):
            # optional argument: required only when no default was supplied
            requiredDict = dict(required=self.default is None)
        parser.add_argument(
            self.name,
            default=self.default,
            help=help,
            **requiredDict)  # cannot specify required=None for positional arguments
253 
254 
class ConfigDatasetType(DynamicDatasetType):
    """!A dataset type specified by a config parameter
    """

    def __init__(self, name):
        """!Construct a ConfigDatasetType

        @param[in] name name of config option whose value is the dataset type
        """
        DynamicDatasetType.__init__(self)
        self.name = name

    def getDatasetType(self, namespace):
        """Return the dataset type as a string, from the appropriate config field

        @param[in] namespace parsed command
        """
        # getattr does not work reliably if the config field name is dotted,
        # so step through one level at a time
        keyList = self.name.split(".")
        value = namespace.config
        for key in keyList:
            try:
                value = getattr(value, key)
            except KeyError:
                # NOTE(review): pex_config field access apparently raises KeyError
                # for a missing field name — confirmed by the original handler here
                raise RuntimeError("Cannot find config parameter %r" % (self.name,))
        return value
282 
283 
class ArgumentParser(argparse.ArgumentParser):
    """!An argument parser for pipeline tasks that is based on argparse.ArgumentParser

    Users may wish to add additional arguments before calling parse_args.

    @note
    - I would prefer to check data ID keys and values as they are parsed,
      but the required information comes from the butler, so I have to construct a butler
      before I do this checking. Constructing a butler is slow, so I only want do it once,
      after parsing the command line, so as to catch syntax errors quickly.
    """
    requireOutput = True  # Require an output directory to be specified?

    def __init__(self, name, usage="%(prog)s input [options]", **kwargs):
        """!Construct an ArgumentParser

        @param[in] name name of top-level task; used to identify camera-specific override files
        @param[in] usage usage string
        @param[in] **kwargs additional keyword arguments for argparse.ArgumentParser
        """
        self._name = name
        self._dataIdArgDict = {}  # Dict of data identifier specifications, by argument name
        argparse.ArgumentParser.__init__(self,
                                         usage=usage,
                                         fromfile_prefix_chars='@',
                                         epilog=textwrap.dedent("""Notes:
            * --config, --configfile, --id, --loglevel and @file may appear multiple times;
                all values are used, in order left to right
            * @file reads command-line options from the specified file:
                * data may be distributed among multiple lines (e.g. one option per line)
                * data after # is treated as a comment and ignored
                * blank lines and lines starting with # are ignored
            * To specify multiple values for an option, do not use = after the option name:
                * right: --configfile foo bar
                * wrong: --configfile=foo bar
            """),
                                         formatter_class=argparse.RawDescriptionHelpFormatter,
                                         **kwargs)
        self.add_argument(metavar='input', dest="rawInput",
                          help="path to input data repository, relative to $%s" % (DEFAULT_INPUT_NAME,))
        self.add_argument("--calib", dest="rawCalib",
                          help="path to input calibration repository, relative to $%s" %
                          (DEFAULT_CALIB_NAME,))
        self.add_argument("--output", dest="rawOutput",
                          help="path to output data repository (need not exist), relative to $%s" %
                          (DEFAULT_OUTPUT_NAME,))
        self.add_argument("--rerun", dest="rawRerun", metavar="[INPUT:]OUTPUT",
                          help="rerun name: sets OUTPUT to ROOT/rerun/OUTPUT; "
                               "optionally sets ROOT to ROOT/rerun/INPUT")
        self.add_argument("-c", "--config", nargs="*", action=ConfigValueAction,
                          help="config override(s), e.g. -c foo=newfoo bar.baz=3", metavar="NAME=VALUE")
        self.add_argument("-C", "--configfile", dest="configfile", nargs="*", action=ConfigFileAction,
                          help="config override file(s)")
        self.add_argument("-L", "--loglevel", nargs="*", action=LogLevelAction,
                          help="logging level; supported levels are [trace|debug|info|warn|error|fatal]",
                          metavar="LEVEL|COMPONENT=LEVEL")
        self.add_argument("--longlog", action="store_true", help="use a more verbose format for the logging")
        self.add_argument("--debug", action="store_true", help="enable debugging output?")
        self.add_argument("--doraise", action="store_true",
                          help="raise an exception on error (else log a message and continue)?")
        self.add_argument("--profile", help="Dump cProfile statistics to filename")
        self.add_argument("--show", nargs="+", default=(),
                          help="display the specified information to stdout and quit "
                               "(unless run is specified).")
        self.add_argument("-j", "--processes", type=int, default=1, help="Number of processes to use")
        self.add_argument("-t", "--timeout", type=float,
                          help="Timeout for multiprocessing; maximum wall time (sec)")
        self.add_argument("--clobber-output", action="store_true", dest="clobberOutput", default=False,
                          help=("remove and re-create the output directory if it already exists "
                                "(safe with -j, but not all other forms of parallel execution)"))
        self.add_argument("--clobber-config", action="store_true", dest="clobberConfig", default=False,
                          help=("backup and then overwrite existing config files instead of checking them "
                                "(safe with -j, but not all other forms of parallel execution)"))
        self.add_argument("--no-backup-config", action="store_true", dest="noBackupConfig", default=False,
                          help="Don't copy config to file~N backup.")
        self.add_argument("--clobber-versions", action="store_true", dest="clobberVersions", default=False,
                          help=("backup and then overwrite existing package versions instead of checking"
                                "them (safe with -j, but not all other forms of parallel execution)"))
        self.add_argument("--no-versions", action="store_true", dest="noVersions", default=False,
                          help="don't check package versions; useful for development")
        # default lsst.log configuration: INFO and above to stderr, terse layout
        lsstLog.configure_prop("""
log4j.rootLogger=INFO, A1
log4j.appender.A1=ConsoleAppender
log4j.appender.A1.Target=System.err
log4j.appender.A1.layout=PatternLayout
log4j.appender.A1.layout.ConversionPattern=%c %p: %m%n
""")

    def add_id_argument(self, name, datasetType, help, level=None, doMakeDataRefList=True,
                        ContainerClass=DataIdContainer):
        """!Add a data ID argument

        Add an argument to specify data IDs. If datasetType is an instance of DatasetArgument,
        then add a second argument to specify the dataset type.

        @param[in] name data ID argument (including leading dashes, if wanted)
        @param[in] datasetType type of dataset; supply a string for a fixed dataset type,
            or a DynamicDatasetType, such as DatasetArgument, for a dynamically determined dataset type
        @param[in] help help string for the argument
        @param[in] level level of dataset, for butler
        @param[in] doMakeDataRefList construct data references?
        @param[in] ContainerClass data ID container class to use to contain results;
            override the default if you need a special means of computing data references from data IDs

        The associated data is put into namespace.<dataIdArgument.name> as an instance of ContainerClass;
        the container includes fields:
        - idList: a list of data ID dicts
        - refList: a list of butler data references (empty if doMakeDataRefList false)
        """
        argName = name.lstrip("-")

        if argName in self._dataIdArgDict:
            raise RuntimeError("Data ID argument %s already exists" % (name,))
        if argName in set(("camera", "config", "butler", "log", "obsPkg")):
            raise RuntimeError("Data ID argument %s is a reserved name" % (name,))

        self.add_argument(name, nargs="*", action=IdValueAction, help=help,
                          metavar="KEY=VALUE1[^VALUE2[^VALUE3...]")

        dataIdArgument = DataIdArgument(
            name=argName,
            datasetType=datasetType,
            level=level,
            doMakeDataRefList=doMakeDataRefList,
            ContainerClass=ContainerClass,
        )

        if dataIdArgument.isDynamicDatasetType:
            datasetType.addArgument(parser=self, idName=argName)

        self._dataIdArgDict[argName] = dataIdArgument

    def parse_args(self, config, args=None, log=None, override=None):
        """!Parse arguments for a pipeline task

        @param[in,out] config config for the task being run
        @param[in] args argument list; if None use sys.argv[1:]
        @param[in] log log (instance lsst.log Log); if None use the default log
        @param[in] override a config override function; it must take the root config object
            as its only argument and must modify the config in place.
            This function is called after camera-specific overrides files are applied, and before
            command-line config overrides are applied (thus allowing the user the final word).

        @return namespace: an argparse.Namespace containing many useful fields including:
        - camera: camera name
        - config: the supplied config with all overrides applied, validated and frozen
        - butler: a butler for the data
        - an entry for each of the data ID arguments registered by add_id_argument(),
          the value of which is a DataIdArgument that includes public elements 'idList' and 'refList'
        - log: a lsst.log Log
        - an entry for each command-line argument, with the following exceptions:
          - config is the supplied config, suitably updated
          - configfile, id and loglevel are all missing
        - obsPkg: name of obs_ package for this camera
        """
        if args is None:
            args = sys.argv[1:]

        # the first positional argument must be the input repository;
        # treat a missing/option-like first argument as a usage error (or plain -h/--help)
        if len(args) < 1 or args[0].startswith("-") or args[0].startswith("@"):
            self.print_help()
            if len(args) == 1 and args[0] in ("-h", "--help"):
                self.exit()
            else:
                self.exit("%s: error: Must specify input as first argument" % self.prog)

        # Note that --rerun may change namespace.input, but if it does we verify that the
        # new input has the same mapper class.
        namespace = argparse.Namespace()
        namespace.input = _fixPath(DEFAULT_INPUT_NAME, args[0])
        if not os.path.isdir(namespace.input):
            self.error("Error: input=%r not found" % (namespace.input,))

        namespace.config = config
        namespace.log = log if log is not None else lsstLog.Log.getDefaultLogger()
        mapperClass = dafPersist.Butler.getMapperClass(namespace.input)
        namespace.camera = mapperClass.getCameraName()
        namespace.obsPkg = mapperClass.getPackageName()

        self.handleCamera(namespace)

        self._applyInitialOverrides(namespace)
        if override is not None:
            override(namespace.config)

        # Add data ID containers to namespace
        for dataIdArgument in self._dataIdArgDict.values():
            setattr(namespace, dataIdArgument.name, dataIdArgument.ContainerClass(level=dataIdArgument.level))

        namespace = argparse.ArgumentParser.parse_args(self, args=args, namespace=namespace)
        del namespace.configfile

        self._parseDirectories(namespace)

        if namespace.clobberOutput:
            if namespace.output is None:
                self.error("--clobber-output is only valid with --output or --rerun")
            elif namespace.output == namespace.input:
                self.error("--clobber-output is not valid when the output and input repos are the same")
            if os.path.exists(namespace.output):
                namespace.log.info("Removing output repo %s for --clobber-output" % namespace.output)
                shutil.rmtree(namespace.output)

        namespace.log.info("input=%s" % (namespace.input,))
        namespace.log.info("calib=%s" % (namespace.calib,))
        namespace.log.info("output=%s" % (namespace.output,))

        obeyShowArgument(namespace.show, namespace.config, exit=False)

        # No environment variable or --output or --rerun specified.
        if self.requireOutput and namespace.output is None and namespace.rerun is None:
            self.error("no output directory specified.\n"
                       "An output directory must be specified with the --output or --rerun\n"
                       "command-line arguments.\n")

        namespace.butler = dafPersist.Butler(
            root=namespace.input,
            calibRoot=namespace.calib,
            outputRoot=namespace.output,
        )

        # convert data in each of the identifier lists to proper types
        # this is done after constructing the butler, hence after parsing the command line,
        # because it takes a long time to construct a butler
        self._processDataIds(namespace)
        if "data" in namespace.show:
            for dataIdName in self._dataIdArgDict.keys():
                for dataRef in getattr(namespace, dataIdName).refList:
                    print("%s dataRef.dataId = %s" % (dataIdName, dataRef.dataId))

        if namespace.show and "run" not in namespace.show:
            sys.exit(0)

        if namespace.debug:
            try:
                import debug
                assert debug  # silence pyflakes
            except ImportError:
                sys.stderr.write("Warning: no 'debug' module found\n")
                namespace.debug = False

        del namespace.loglevel

        if namespace.longlog:
            lsstLog.configure_prop("""
log4j.rootLogger=INFO, A1
log4j.appender.A1=ConsoleAppender
log4j.appender.A1.Target=System.err
log4j.appender.A1.layout=PatternLayout
log4j.appender.A1.layout.ConversionPattern=%-5p %d{yyyy-MM-ddThh:mm:ss.sss} %c (%X{LABEL})(%F:%L)- %m%n
""")
        del namespace.longlog

        namespace.config.validate()
        namespace.config.freeze()

        return namespace

    def _parseDirectories(self, namespace):
        """Parse input, output and calib directories

        This allows for hacking the directories, e.g., to include a "rerun".
        Modifications are made to the 'namespace' object in-place.
        """
        mapperClass = dafPersist.Butler.getMapperClass(_fixPath(DEFAULT_INPUT_NAME, namespace.rawInput))
        namespace.calib = _fixPath(DEFAULT_CALIB_NAME, namespace.rawCalib)

        # If an output directory is specified, process it and assign it to the namespace
        if namespace.rawOutput:
            namespace.output = _fixPath(DEFAULT_OUTPUT_NAME, namespace.rawOutput)
        else:
            namespace.output = None

        # This section processes the rerun argument, if rerun is specified as a colon separated
        # value, it will be parsed as an input and output. The input value will be overridden if
        # previously specified (but a check is made to make sure both inputs use the same mapper)
        if namespace.rawRerun:
            if namespace.output:
                self.error("Error: cannot specify both --output and --rerun")
            namespace.rerun = namespace.rawRerun.split(":")
            rerunDir = [os.path.join(namespace.input, "rerun", dd) for dd in namespace.rerun]
            modifiedInput = False
            if len(rerunDir) == 2:
                namespace.input, namespace.output = rerunDir
                modifiedInput = True
            elif len(rerunDir) == 1:
                namespace.output = rerunDir[0]
                if os.path.exists(namespace.output):
                    # an existing output rerun implies its _parent is the effective input
                    namespace.input = os.path.realpath(os.path.join(namespace.output, "_parent"))
                    modifiedInput = True
            else:
                self.error("Error: invalid argument for --rerun: %s" % namespace.rerun)
            if modifiedInput and dafPersist.Butler.getMapperClass(namespace.input) != mapperClass:
                self.error("Error: input directory specified by --rerun must have the same mapper as INPUT")
        else:
            namespace.rerun = None
        del namespace.rawInput
        del namespace.rawCalib
        del namespace.rawOutput
        del namespace.rawRerun

    def _processDataIds(self, namespace):
        """!Process the parsed data for each data ID argument

        Processing includes:
        - Validate data ID keys
        - Cast the data ID values to the correct type
        - Compute data references from data IDs

        @param[in,out] namespace parsed namespace (an argparse.Namespace);
            reads these attributes:
            - butler
            - log
            - config, if any dynamic dataset types are set by a config parameter
            - dataset type arguments (e.g. id_dstype), if any dynamic dataset types are specified by such
            and modifies these attributes:
            - <name> for each data ID argument registered using add_id_argument
        """
        for dataIdArgument in self._dataIdArgDict.values():
            dataIdContainer = getattr(namespace, dataIdArgument.name)
            dataIdContainer.setDatasetType(dataIdArgument.getDatasetType(namespace))
            if dataIdArgument.doMakeDataRefList:
                try:
                    dataIdContainer.castDataIds(butler=namespace.butler)
                except (KeyError, TypeError) as e:
                    # failure of castDataIds indicates invalid command args
                    self.error(e)

                # failure of makeDataRefList indicates a bug that wants a traceback
                dataIdContainer.makeDataRefList(namespace)

    def _applyInitialOverrides(self, namespace):
        """!Apply obs-package-specific and camera-specific config override files, if found

        @param[in] namespace parsed namespace (an argparse.Namespace);
            reads these attributes:
            - obsPkg

        Look in the package namespace.obsPkg for files:
        - config/<task_name>.py
        - config/<camera_name>/<task_name>.py
        and load if found
        """
        obsPkgDir = lsst.utils.getPackageDir(namespace.obsPkg)
        fileName = self._name + ".py"
        for filePath in (
            os.path.join(obsPkgDir, "config", fileName),
            os.path.join(obsPkgDir, "config", namespace.camera, fileName),
        ):
            if os.path.exists(filePath):
                namespace.log.info("Loading config override file %r" % (filePath,))
                namespace.config.load(filePath)
            else:
                namespace.log.info("Config override file does not exist: %r" % (filePath,))

    def handleCamera(self, namespace):
        """!Perform camera-specific operations before parsing the command line.

        The default implementation does nothing.

        @param[in,out] namespace namespace (an argparse.Namespace) with the following fields:
            - camera: the camera name
            - config: the config passed to parse_args, with no overrides applied
            - obsPkg: the obs_ package for this camera
            - log: a lsst.log Log
        """
        pass

    def convert_arg_line_to_args(self, arg_line):
        """!Allow files of arguments referenced by `@<path>` to contain multiple values on each line

        @param[in] arg_line line of text read from an argument file
        """
        arg_line = arg_line.strip()
        # skip blank lines and whole-line comments
        if not arg_line or arg_line.startswith("#"):
            return
        for arg in shlex.split(arg_line, comments=True, posix=True):
            if not arg.strip():
                continue
            yield arg
663 
664 
class InputOnlyArgumentParser(ArgumentParser):
    """An ArgumentParser for pipeline tasks that don't write any output"""
    requireOutput = False  # We're not going to write anything
668 
669 
def getTaskDict(config, taskDict=None, baseName=""):
    """!Get a dictionary of task info for all subtasks in a config

    Designed to be called recursively; the user should call with only a config
    (leaving taskDict and baseName at their default values).

    @param[in] config configuration to process, an instance of lsst.pex.config.Config
    @param[in,out] taskDict users should not specify this argument;
        (supports recursion; if provided, taskDict is updated in place, else a new dict is started)
    @param[in] baseName users should not specify this argument.
        (supports recursion: if a non-empty string then a period is appended and the result is used
        as a prefix for additional entries in taskDict; otherwise no prefix is used)
    @return taskDict: a dict of config field name: task name
    """
    if taskDict is None:
        taskDict = dict()
    for fieldName, field in config.items():
        # only ConfigurableField-like entries carry both .value and .target
        if not (hasattr(field, "value") and hasattr(field, "target")):
            continue
        subConfig = field.value
        if isinstance(subConfig, pexConfig.Config):
            subBaseName = "%s.%s" % (baseName, fieldName) if baseName else fieldName
            try:
                taskName = "%s.%s" % (field.target.__module__, field.target.__name__)
            except Exception:
                taskName = repr(field.target)
            taskDict[subBaseName] = taskName
            # recurse into the subtask's own config
            getTaskDict(config=subConfig, taskDict=taskDict, baseName=subBaseName)
    return taskDict
698 
699 
def obeyShowArgument(showOpts, config=None, exit=False):
    """!Process arguments specified with --show (but ignores "data")

    @param showOpts List of options passed to --show
    @param config The provided config
    @param exit Exit if "run" isn't included in showOpts

    Supports the following options in showOpts:
    - config[=PAT] Dump all the config entries, or just the ones that match the glob pattern
    - tasks Show task hierarchy
    - data Ignored; to be processed by caller
    - run Keep going (the default behaviour is to exit if --show is specified)

    Calls sys.exit(1) if any other option found.
    """
    if not showOpts:
        return

    for what in showOpts:
        # "config" may carry an optional glob pattern after "=", e.g. --show config=*calib*
        mat = re.search(r"^config(?:=(.+))?", what)
        if mat:
            pattern = mat.group(1)
            if pattern:
                class FilteredStream(object):
                    """A file object that only prints lines that match the glob "pattern"

                    N.b. Newlines are silently discarded and reinserted; crude but effective.
                    """

                    def __init__(self, pattern):
                        # obey case if pattern isn't lowercase or requests NOIGNORECASE
                        mat = re.search(r"(.*):NOIGNORECASE$", pattern)

                        if mat:
                            # strip the :NOIGNORECASE suffix and match case-sensitively
                            pattern = mat.group(1)
                            self._pattern = re.compile(fnmatch.translate(pattern))
                        else:
                            if pattern != pattern.lower():
                                print(u"Matching \"%s\" without regard to case "
                                      "(append :NOIGNORECASE to prevent this)" % (pattern,), file=sys.stdout)
                            self._pattern = re.compile(fnmatch.translate(pattern), re.IGNORECASE)

                    def write(self, showStr):
                        # called by config.saveToStream; filter each emitted entry
                        showStr = showStr.rstrip()
                        # Strip off doc string line(s) and cut off at "=" for string matching
                        matchStr = showStr.split("\n")[-1].split("=")[0]
                        if self._pattern.search(matchStr):
                            print(u"\n" + showStr)

                fd = FilteredStream(pattern)
            else:
                # no pattern: dump the whole config unfiltered
                fd = sys.stdout

            config.saveToStream(fd, "config")
        elif what == "data":
            # handled by the caller (needs the butler/refLists)
            pass
        elif what == "run":
            # "run" merely suppresses the exit below
            pass
        elif what == "tasks":
            showTaskHierarchy(config)
        else:
            print(u"Unknown value for show: %s (choose from '%s')" %
                  (what, "', '".join("config[=XXX] data tasks run".split())), file=sys.stderr)
            sys.exit(1)

    if exit and "run" not in showOpts:
        sys.exit(0)
767 
768 
def showTaskHierarchy(config):
    """!Print the hierarchy of subtasks in a config to stdout

    @param[in] config: configuration to process (an lsst.pex.config.Config)
    """
    print(u"Subtasks:")
    taskDict = getTaskDict(config=config)
    # report each subtask in sorted field-name order
    for fieldName in sorted(taskDict):
        print(u"%s: %s" % (fieldName, taskDict[fieldName]))
781 
782 
class ConfigValueAction(argparse.Action):
    """!argparse action callback to override config parameters using name=value pairs from the command line
    """

    def __call__(self, parser, namespace, values, option_string):
        """!Override one or more config name value pairs

        @param[in] parser           argument parser (instance of ArgumentParser)
        @param[in,out] namespace    parsed command (an instance of argparse.Namespace);
            updated value: namespace.config
        @param[in] values           a list of configItemName=value pairs
        @param[in] option_string    option value specified by the user (a str)
        """
        # without a config object there is nothing to override
        if namespace.config is None:
            return
        for nameValue in values:
            name, dummy, valueStr = nameValue.partition("=")
            if not valueStr:
                parser.error("%s value %s must be in form name=value" % (option_string, nameValue))

            # First attempt: assign the raw string; many config fields accept it directly.
            try:
                setDottedAttr(namespace.config, name, valueStr)
                continue
            except AttributeError:
                parser.error("no config field: %s" % (name,))
            except Exception:
                pass

            # The raw string was rejected; evaluate it as a Python expression and retry.
            try:
                value = eval(valueStr, {})
            except Exception:
                parser.error("cannot parse %r as a value for %s" % (valueStr, name))
            try:
                setDottedAttr(namespace.config, name, value)
            except Exception as e:
                parser.error("cannot set config.%s=%r: %s" % (name, value, e))
818 
819 
class ConfigFileAction(argparse.Action):
    """!argparse action to load config overrides from one or more files
    """

    def __call__(self, parser, namespace, values, option_string=None):
        """!Load one or more files of config overrides

        @param[in] parser           argument parser (instance of ArgumentParser)
        @param[in,out] namespace    parsed command (an instance of argparse.Namespace);
            updated value: namespace.config
        @param[in] values           a list of config override file paths
        @param[in] option_string    option value specified by the user (a str)
        """
        config = namespace.config
        # no config object yet means there is nothing to apply the overrides to
        if config is None:
            return
        for configfile in values:
            try:
                config.load(configfile)
            except Exception as e:
                parser.error("cannot load config file %r: %s" % (configfile, e))
841 
842 
class IdValueAction(argparse.Action):
    """!argparse action callback to process a data ID into a dict
    """

    def __call__(self, parser, namespace, values, option_string):
        """!Parse --id data and append results to namespace.<argument>.idList

        @param[in] parser           argument parser (instance of ArgumentParser)
        @param[in,out] namespace    parsed command (an instance of argparse.Namespace);
            updated value: <idName>.idList, where <idName> is the name of the
            ID argument, for instance "id" for ID argument --id
        @param[in] values           a list of data IDs; see data format below
        @param[in] option_string    option value specified by the user (a str)

        The data format is:
        key1=value1_1[^value1_2[^value1_3...] key2=value2_1[^value2_2[^value2_3...]...

        Each value (e.g. value1_1) may be a plain string, or a range of the form
        "int..int" (e.g. "1..3"), which is interpreted as "1^2^3" (inclusive,
        unlike a Python range). A stride may be appended: "1..5:2" is "1^3^5".
        So "0^2..4^7..9" is equivalent to "0^2^3^4^7^8^9".

        The cross product is computed for keys with multiple values. For example:
            --id visit 1^2 ccd 1,1^2,2
        results in the following data ID dicts being appended to
        namespace.<argument>.idList:
            {"visit":1, "ccd":"1,1"}
            {"visit":2, "ccd":"1,1"}
            {"visit":1, "ccd":"2,2"}
            {"visit":2, "ccd":"2,2"}
        """
        if namespace.config is None:
            return
        idDict = collections.OrderedDict()
        for pair in values:
            keyName, dummy, rawValue = pair.partition("=")
            if keyName in idDict:
                parser.error("%s appears multiple times in one ID argument: %s" % (keyName, option_string))
            expanded = []
            for token in rawValue.split("^"):
                rangeMat = re.search(r"^(\d+)\.\.(\d+)(?::(\d+))?$", token)
                if rangeMat is None:
                    expanded.append(token)
                else:
                    first = int(rangeMat.group(1))
                    last = int(rangeMat.group(2))
                    strideStr = rangeMat.group(3)
                    stride = int(strideStr) if strideStr else 1
                    # ranges are inclusive, unlike Python's range
                    expanded.extend(str(val) for val in range(first, last + 1, stride))
            idDict[keyName] = expanded

        # cross product of all key values, preserving key order in each dict
        keyList = list(idDict.keys())
        idDictList = [collections.OrderedDict(zip(keyList, combo))
                      for combo in itertools.product(*idDict.values())]

        getattr(namespace, option_string.lstrip("-")).idList += idDictList
900 
901 
class LogLevelAction(argparse.Action):
    """!argparse action to set log level
    """

    def __call__(self, parser, namespace, values, option_string):
        """!Set trace level

        @param[in] parser           argument parser (instance of ArgumentParser)
        @param[in] namespace        parsed command (an instance of argparse.Namespace); ignored
        @param[in] values           a list of trace levels; each item is either
            'component_name=level' or 'level', where level is one of
            TRACE, DEBUG, INFO, WARN, ERROR, FATAL (case insensitive)
        @param[in] option_string    option value specified by the user (a str)
        """
        permittedLevelList = ('TRACE', 'DEBUG', 'INFO', 'WARN', 'ERROR', 'FATAL')
        for componentLevel in values:
            component, dummy, levelStr = componentLevel.partition("=")
            if not levelStr:
                # a bare level with no component applies to the root log
                component, levelStr = None, component
            logLevelUpr = levelStr.upper()
            if logLevelUpr not in permittedLevelList:
                parser.error("loglevel=%r not one of %s" % (levelStr, permittedLevelList))
            logLevel = getattr(lsstLog.Log, logLevelUpr)
            target = namespace.log if component is None else lsstLog.Log.getLogger(component)
            target.setLevel(logLevel)
931 
932 
def setDottedAttr(item, name, value):
    """!Like setattr, but accepts hierarchical names, e.g. foo.bar.baz

    @param[in,out] item     object whose (possibly nested) attribute is to be set
    @param[in] name         dotted attribute name, e.g. "foo.bar.baz"
    @param[in] value        new value for the attribute

    For example if name is foo.bar.baz then item.foo.bar.baz is set to the specified value.
    """
    path = name.split(".")
    target = item
    # walk down to the object that owns the final attribute
    while len(path) > 1:
        target = getattr(target, path.pop(0))
    setattr(target, path[0], value)
947 
948 
def getDottedAttr(item, name):
    """!Like getattr, but accepts hierarchical names, e.g. foo.bar.baz

    @param[in] item     object whose (possibly nested) attribute is to be returned
    @param[in] name     dotted attribute name, e.g. "foo.bar.baz"

    For example if name is foo.bar.baz then item.foo.bar.baz is returned.
    """
    head, dummy, rest = name.partition(".")
    value = getattr(item, head)
    # recurse until the dotted path is exhausted
    return getDottedAttr(value, rest) if rest else value
961 
962 
def dataExists(butler, datasetType, dataRef):
    """!Return True if data exists at the current level or any data exists at a deeper level, False otherwise

    @param[in] butler       data butler (a \ref lsst.daf.persistence.butler.Butler
        "lsst.daf.persistence.Butler")
    @param[in] datasetType  dataset type (a str)
    @param[in] dataRef      butler data reference (a \ref lsst.daf.persistence.butlerSubset.ButlerDataRef
        "lsst.daf.persistence.ButlerDataRef")
    """
    children = dataRef.subItems()
    if not children:
        # leaf reference: ask the butler directly
        return butler.datasetExists(datasetType=datasetType, dataId=dataRef.dataId)
    # non-leaf: true if any descendant has data (short-circuits on first hit)
    return any(dataExists(butler, datasetType, child) for child in children)
def setDatasetType
Set actual dataset type, once it is known.
def castDataIds
Validate data IDs and cast them to the correct type (modify idList in place).
argparse action to set log level
An argument parser for pipeline tasks that is based on argparse.ArgumentParser.
def dataExists
Return True if data exists at the current level or any data exists at a deeper level, False otherwise.
A dataset type specified by a command-line argument.
def showTaskHierarchy
Print task hierarchy to stdout.
Glorified struct for data about id arguments, used by ArgumentParser.add_id_argument.
def setDottedAttr
Like setattr, but accepts hierarchical names, e.g.
def __call__
Parse --id data and append results to namespace.
argparse action callback to override config parameters using name=value pairs from the command line ...
def getTaskDict
Get a dictionary of task info for all subtasks in a config.
def add_id_argument
Add a data ID argument.
std::string getPackageDir(std::string const &packageName)
return the root directory of a setup package
Definition: Utils.cc:34
Definition: Log.h:716
def _applyInitialOverrides
Apply obs-package-specific and camera-specific config override files, if found.
def makeDataRefList
Compute refList based on idList.
def __init__
Construct a DatasetArgument.
def convert_arg_line_to_args
Allow files of arguments referenced by @<path> to contain multiple values on each line...
def getDottedAttr
Like getattr, but accepts hierarchical names, e.g.
def addArgument
Add a command-line argument to specify dataset type name.
def __call__
Load one or more files of config overrides.
def isDynamicDatasetType
Is the dataset type dynamic (specified on the command line)?
def __call__
Override one or more config name value pairs.
argparse action callback to process a data ID into a dict
def __init__
Construct a ConfigDatasetType.
def setLevel
Definition: log.py:71
def handleCamera
Perform camera-specific operations before parsing the command line.
def parse_args
Parse arguments for a pipeline task.
def _processDataIds
Process the parsed data for each data ID argument.
A dataset type specified by a config parameter.
def __init__
Construct an ArgumentParser.
def obeyShowArgument
Process arguments specified with --show (but ignores "data")
Abstract base class for a dataset type determined from parsed command-line arguments.
def _fixPath
Apply environment variable as default root, if present, and abspath.
def addArgument
Add a command-line argument to specify dataset type name, if wanted.
argparse action to load config overrides from one or more files
def getDatasetType
Return the dataset type as a string.
def __init__
Construct a DataIdContainer.
A container for data IDs and associated data references.