27 """This module defines the Butler class."""
from future import standard_library
standard_library.install_aliases()
from builtins import str
from past.builtins import basestring
from builtins import object

import collections
import copy
import inspect
import os

from lsst.log import Log
from . import LogicalLocation, ReadProxy, ButlerSubset, ButlerDataRef, Persistence, \
    Storage, Policy, NoResults, Repository, DataId, RepositoryCfg, \
    RepositoryArgs, listify, setify, sequencify, doImport
49 """Represents a Butler configuration.
53 cfg is 'wet paint' and very likely to change. Use of it in production
54 code other than via the 'old butler' API is strongly discouraged.
56 yaml_tag =
u"!ButlerCfg"
        super(ButlerCfg, self).__init__({'repoCfg': repoCfg, 'cls': cls})
63 """Container object for repository data used by Butler"""
66 """Initializer for RepoData
68 @param args (RepositoryArgs) Arguments used to initialize self.repo
69 @param cfg (RepositoryCfg) Configuration of repository (this is persisted)
70 @param repo (Repository) The repository class instance
71 @param tags (set) The tags that apply to this repository, if any
        if not isinstance(tags, set):
            raise RuntimeError("tags passed into RepoData must be in a set.")
87 return "RepoData(args=%s cfg=%s repo=%s tags=%s" % (self.
args, self.
cfg, self.
repo, self.
tags)
91 """Container object for RepoData instances owned by a Butler instance."""
101 """Add a RepoData to the container
103 @param (RepoData) RepoData instance to add
109 self.
byCfgRoot[repoData.args.cfgRoot] = repoData
112 """Get a list of RepoData that are used to as inputs to the Butler.
114 The list is created lazily as needed, and cached.
115 @return a list of RepoData with readable repositories. List is in the order to be use when searching.
118 self.
_inputs = [rd
for rd
in self.byRepoRoot.values()
if 'r' in rd.mode]
122 """Get a list of RepoData that are used to as outputs to the Butler.
124 The list is created lazily as needed, and cached.
125 @return a list of RepoData with writable repositories. List is in the order to be use when searching.
128 self.
_outputs = [rd
for rd
in self.byRepoRoot.values()
if 'w' in rd.mode]
132 """Get a list of all RepoData that are used to as by the Butler.
134 The list is created lazily as needed, and cached.
135 @return a list of RepoData with writable repositories. List is in the order to be use when searching.
137 if self.
_all is None:
138 self.
_all = [rd
for rd
in self.byRepoRoot.values()]
142 return "%s(\nbyRepoRoot=%r, \nbyCfgRoot=%r, \n_inputs=%r, \n_outputs=%s, \n_all=%s)" % (
143 self.__class__.__name__,
152 """Butler provides a generic mechanism for persisting and retrieving data using mappers.
154 A Butler manages a collection of datasets known as a repository. Each
155 dataset has a type representing its intended usage and a location. Note
156 that the dataset type is not the same as the C++ or Python type of the
157 object containing the data. For example, an ExposureF object might be
158 used to hold the data for a raw image, a post-ISR image, a calibrated
159 science image, or a difference image. These would all be different
162 A Butler can produce a collection of possible values for a key (or tuples
163 of values for multiple keys) if given a partial data identifier. It can
164 check for the existence of a file containing a dataset given its type and
165 data identifier. The Butler can then retrieve the dataset. Similarly, it
166 can persist an object to an appropriate location when given its associated
169 Note that the Butler has two more advanced features when retrieving a data
170 set. First, the retrieval is lazy. Input does not occur until the data
171 set is actually accessed. This allows datasets to be retrieved and
172 placed on a clipboard prospectively with little cost, even if the
173 algorithm of a stage ends up not using them. Second, the Butler will call
174 a standardization hook upon retrieval of the dataset. This function,
175 contained in the input mapper object, must perform any necessary
176 manipulations to force the retrieved object to conform to standards,
177 including translating metadata.

    Public methods:

    __init__(self, root, mapper=None, **mapperArgs)
    defineAlias(self, alias, datasetType)
    getKeys(self, datasetType=None, level=None)
    queryMetadata(self, datasetType, keys, format=None, dataId={}, **rest)
    datasetExists(self, datasetType, dataId={}, **rest)
    get(self, datasetType, dataId={}, immediate=False, **rest)
    put(self, obj, datasetType, dataId={}, **rest)
    subset(self, datasetType, level=None, dataId={}, **rest)
    dataRef(self, datasetType, level=None, dataId={}, **rest)
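
    A minimal usage sketch (the repository paths, the 'calexp' dataset type, and the
    'visit'/'ccd' dataId keys below are hypothetical; real dataset types and keys are
    defined by the repository's mapper):

        butler = Butler(inputs='/path/to/inputRepo', outputs='/path/to/outputRepo')
        exposure = butler.get('calexp', dataId={'visit': 1234, 'ccd': 5})
        butler.put(exposure, 'calexp', dataId={'visit': 1234, 'ccd': 5})
    """
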
    def __init__(self, root=None, mapper=None, inputs=None, outputs=None, **mapperArgs):
201 """Initializer for the Class.
203 The prefered initialization argument is to pass a single arg; cfg created by Butler.cfg();
204 butler = Butler(Butler.cfg(repoCfg))
205 For backward compatibility: this initialization method signature can take a posix root path, and
206 optionally a mapper class instance or class type that will be instantiated using the mapperArgs input
208 However, for this to work in a backward compatible way it creates a single repository that is used as
209 both an input and an output repository. This is NOT preferred, and will likely break any provenance
210 system we have in place.
212 @param root (str) Best practice is to pass in a cfg created by Butler.cfg(). But for backward
213 compatibility this can also be a fileysystem path. Will only work with a
215 @param mapper Deprecated. Provides a mapper to be used with Butler.
216 @param mapperArgs Deprecated. Provides arguments to be passed to the mapper if the mapper input arg
217 is a class type to be instantiated by Butler.
218 @param inputs (RepositoryArg or string) Can be a single item or a list. Provides arguments to load an
219 existing repository (or repositories). String is assumed to be
220 a URI and is used as the cfgRoot (URI to the location of the
221 cfg file). (Local file system URI does not have to start with
222 'file://' and in this way can be a relative path).
223 @param outputs (RepositoryArg) Can be a single item or a list. Provides arguments to load one or more
224 existing repositories or create new ones. String is assumed to be a
225 URI and as used as the repository root.
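
        For example (a sketch; the repository paths are hypothetical), a Butler that reads from one
        existing repository and writes to a new one could be constructed as:

            butler = Butler(inputs='/datasets/inputRepo', outputs='/scratch/outputRepo')
        """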
        self._initArgs = {'root': root, 'mapper': mapper, 'inputs': inputs, 'outputs': outputs,
                          'mapperArgs': mapperArgs}
        isLegacyRepository = inputs is None and outputs is None
        if root is not None and not isLegacyRepository:
            raise RuntimeError(
                'root is a deprecated parameter and may not be used with the parameters inputs and outputs')
        if isLegacyRepository:
            if hasattr(mapper, 'root'):
                # a mapper instance may already carry the repository root; prefer it
                root = mapper.root
            outputs = RepositoryArgs(mode='rw',
                                     root=root,
                                     mapper=mapper,
                                     mapperArgs=mapperArgs)
            outputs.isLegacyRepository = True
        self.log = Log.getLogger("daf.persistence.butler")
        inputs = [RepositoryArgs(cfgRoot=i) if isinstance(i, basestring) else i for i in inputs]
        outputs = [RepositoryArgs(root=o) if isinstance(o, basestring) else o for o in outputs]
        butlerIOParents = collections.OrderedDict()
        for args in outputs + inputs:
            butlerIOParents[args.cfgRoot] = args
        for args in outputs:
            self._addRepo(args, inout='out', defaultMapper=defaultMapper, butlerIOParents=butlerIOParents)
        for args in inputs:
            self._addRepo(args, inout='in', butlerIOParents=butlerIOParents)
    def _addRepo(self, args, inout, defaultMapper=None, butlerIOParents=None, tags=None):
291 """Create a Repository and related infrastructure and add it to the list of repositories.
293 @param args (RepositoryArgs) settings used to create the repository.
294 @param inout (string) must be 'in' our 'out', indicates how the repository is to be used. Input repos
295 are only read from, and output repositories may be read from and/or written to
296 (w/rw of output repos depends on args.mode)
297 @param defaultMapper (mapper class or None ) if a default mapper could be inferred from inputs then
298 this will be a class object that can be used for any
299 outputs that do not explicitly define their mapper. If
300 None then a mapper class could not be inferred and a
301 mapper must be defined by each output.
302 @param butlerIOParents (ordered dict) The keys are cfgRoot of repoArgs, val is the repoArgs.
303 This is all the explicit input and output repositories to the
304 butler __init__ function, it is used when determining what the
305 parents of writable repositories are.
306 @param tags (any or list of any) Any object that can be tested to be the same as the tag in a dataId
307 passed into butler input functions. Applies only to input
308 repositories: If tag is specified by the dataId then the repo will
309 only be read from used if the tag in the dataId matches a tag used
        if butlerIOParents is None:
            butlerIOParents = {}

        tags = copy.copy(setify(tags))
        tags.update(args.tags)
        if args.cfgRoot in self._repos.byCfgRoot:
            repoData = self._repos.byCfgRoot[args.cfgRoot]
            if not repoData.cfg.matchesArgs(args):
                raise RuntimeError("Mismatched repository configurations passed in or loaded:" +
                                   "\n\texisting repoData:%s" % repoData)
            repoData.tags.update(setify(tags))
        if inout == 'out':
            if 'w' not in args.mode:
                raise RuntimeError('Output repositories must be writable.')
        elif inout == 'in':
            if 'r' not in args.mode:
                raise RuntimeError('Input repositories must be readable.')
        else:
            raise RuntimeError('Unrecognized value for inout: %s' % inout)
        cfg = Storage.getRepositoryCfg(args.cfgRoot)
        if cfg is not None:
            for cfgRoot in butlerIOParents:
                if cfgRoot not in cfg.parents and cfgRoot != args.cfgRoot:
                    raise RuntimeError(
                        "Existing output repository parents do not match butler's inputs.")
            if not cfg.matchesArgs(args):
                raise RuntimeError(
                    "Persisted RepositoryCfg and passed-in RepositoryArgs have"
                    " conflicting parameters:\n\t%s\n\t%s" % (cfg, args))
            if args.mapperArgs is not None:
                if cfg.mapperArgs is None:
                    cfg.mapperArgs = args.mapperArgs
                else:
                    cfg.mapperArgs.update(args.mapperArgs)
            parentsToAdd = copy.copy(cfg.parents)
        else:
            if args.mapper is None:
                if defaultMapper is None:
                    raise RuntimeError(
                        "Could not infer mapper and one not specified in repositoryArgs:%s" % args)
                args.mapper = defaultMapper
            parents = [cfgRoot for cfgRoot in butlerIOParents if cfgRoot != args.cfgRoot]
            cfg = RepositoryCfg.makeFromArgs(args, parents)
            Storage.putRepositoryCfg(cfg, args.cfgRoot)
        repo = Repository(cfg)
        self._repos.add(RepoData(args, cfg, repo, tags))
        for parent in parentsToAdd:
            if parent in butlerIOParents:
                args = butlerIOParents[parent]
            else:
                args = RepositoryArgs(cfgRoot=parent, mode='r')
            self._addRepo(args=args, inout='in', tags=tags)
        return 'Butler(datasetTypeAliasDict=%s, repos=%s, persistence=%s)' % (
            if args.mapper is not None:
                mapper = args.mapper
                # the mapper may be given as an importable string, an instance, or a class
                if isinstance(mapper, basestring):
                    mapper = doImport(mapper)
                elif not inspect.isclass(mapper):
                    mapper = mapper.__class__
            else:
                cfgRoot = args.cfgRoot
                mapper = Butler.getMapperClass(cfgRoot)
        if len(mappers) == 1:
420 """posix-only; gets the mapper class at the path specifed by root (if a file _mapper can be found at
421 that location or in a parent location.
423 As we abstract the storage and support different types of storage locaitons this method will be
424 moved entirely into Butler Access, or made more dynamic, and the API will very likely change."""
425 return Storage.getMapperClass(root)
428 """Register an alias that will be substituted in datasetTypes.
430 @param alias (str) the alias keyword. it may start with @ or not. It may not contain @ except as the
432 @param datasetType (str) the string that will be substituted when @alias is passed into datasetType.
433 It may not contain '@'
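
        For example (a sketch; the dataset type names are hypothetical):

            butler.defineAlias('calexp', 'deepCoadd_calexp')
            exposure = butler.get('@calexp', dataId)

        Any subsequent use of '@calexp' as a datasetType is then replaced with 'deepCoadd_calexp'.
        """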
        atLoc = alias.rfind('@')
        if atLoc == -1:
            alias = "@" + str(alias)
        elif atLoc > 0:
            raise RuntimeError("Badly formatted alias string: %s" % (alias,))

        # verify that datasetType does not contain '@'
        if datasetType.count('@') != 0:
            raise RuntimeError("Badly formatted type string: %s" % (datasetType))

        # verify that the alias keyword does not start with another alias, and vice versa
        for key in self.datasetTypeAliasDict:
            if key.startswith(alias) or alias.startswith(key):
                raise RuntimeError("Alias: %s overlaps with existing alias: %s" % (alias, key))
    def getKeys(self, datasetType=None, level=None, tag=None):
        """Returns a dict. The dict keys are the valid data id keys at or above the given level of
        hierarchy for the dataset type or the entire collection if None. The dict values are the basic
        Python types corresponding to the keys (int, float, str).

        @param datasetType (str) the type of dataset to get keys for, entire collection if None.
        @param level (str) the hierarchy level to descend to. None if it should not be restricted. Use an
                           empty string if the mapper should look up the default level.
        @param tag (any or list of any) Any object that can be tested to be the same as the tag in a dataId
                           passed into butler input functions. Applies only to input repositories: if a tag
                           is specified by the dataId then the repo will only be read from if the tag in
                           the dataId matches a tag used for that repository.
        @returns (dict) valid data id keys; values are corresponding types.
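
        For example (a sketch; the dataset type and the returned keys are hypothetical):

            keys = butler.getKeys('raw')
            # e.g. {'visit': int, 'ccd': int, 'filter': str}
        """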
        for repoData in self._repos.inputs():
            if not tag or len(tag.intersection(repoData.tags)) > 0:
                keys = repoData.repo.getKeys(datasetType, level)
485 """Returns the valid values for one or more keys when given a partial
486 input collection data id.
488 @param datasetType (str) the type of dataset to inquire about.
489 @param key (str) a key giving the level of granularity of the inquiry.
490 @param format (str, tuple) an optional key or tuple of keys to be returned.
491 @param dataId (DataId, dict) the partial data id.
492 @param **rest keyword arguments for the partial data id.
493 @returns (list) a list of valid values or tuples of valid values as
494 specified by the format (defaulting to the same as the key) at the
495 key's level of granularity.
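
        For example (a sketch; the dataset type, key, and returned values are hypothetical):

            visits = butler.queryMetadata('raw', 'visit', dataId={'filter': 'g'})
            # e.g. [1234, 1235, 1236]
        """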
        dataId = DataId(dataId)
        dataId.update(**rest)

        for repoData in self._repos.inputs():
            if not dataId.tag or len(dataId.tag.intersection(repoData.tags)) > 0:
                tuples = repoData.repo.queryMetadata(datasetType, format, dataId)
529 """Determines if a dataset file exists.
531 @param datasetType (str) the type of dataset to inquire about.
532 @param dataId (DataId, dict) the data id of the dataset.
533 @param **rest keyword arguments for the data id.
534 @returns (bool) True if the dataset exists or is non-file-based.
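
        For example (a sketch; the dataset type and dataId keys are hypothetical):

            if butler.datasetExists('raw', dataId={'visit': 1234, 'ccd': 5}):
                exposure = butler.get('raw', dataId={'visit': 1234, 'ccd': 5})
        """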
        dataId = DataId(dataId)
        dataId.update(**rest)

        location = None
        for repoData in self._repos.inputs():
            if not dataId.tag or len(dataId.tag.intersection(repoData.tags)) > 0:
                location = repoData.repo.map(datasetType, dataId)

        additionalData = location.getAdditionalData()
        storageName = location.getStorageName()
        if storageName in ('BoostStorage', 'FitsStorage', 'PafStorage',
                           'PickleStorage', 'ConfigStorage', 'FitsCatalogStorage'):
            locations = location.getLocations()
            for locationString in locations:
                logLoc = LogicalLocation(locationString, additionalData).locString()
                if storageName == 'FitsStorage':
                    # strip any cfitsio bracket directive, e.g. "file.fits[1]"
                    bracket = logLoc.find('[')
                    if bracket != -1:
                        logLoc = logLoc[:bracket]
                if not os.path.exists(logLoc):
                    return False
        else:
            self.log.warn("datasetExists() for non-file storage %s, dataset type=%s, keys=%s",
                          storageName, datasetType, str(dataId))
        return True
    def get(self, datasetType, dataId=None, immediate=False, **rest):
        """Retrieves a dataset given an input collection data id.

        @param datasetType (str) the type of dataset to retrieve.
        @param dataId (dict) the data id.
        @param immediate (bool) don't use a proxy for delayed loading.
        @param **rest keyword arguments for the data id.
        @returns an object retrieved from the dataset (or a proxy for one).
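
        For example (a sketch; the dataset type and dataId keys are hypothetical):

            # returns a lazy-loading proxy unless immediate=True
            exposure = butler.get('calexp', dataId={'visit': 1234, 'ccd': 5}, immediate=True)
        """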
        dataId = DataId(dataId)
        dataId.update(**rest)

        location = None
        for repoData in self._repos.inputs():
            if not dataId.tag or len(dataId.tag.intersection(repoData.tags)) > 0:
                location = repoData.repo.map(datasetType, dataId)
                if location:
                    break
        if location is None:
            raise NoResults("No locations for get:", datasetType, dataId)
        self.log.debug("Get type=%s keys=%s from %s", datasetType, dataId, str(location))

        if hasattr(location.mapper, "bypass_" + datasetType):
            pythonType = location.getPythonType()
            if pythonType is not None:
                if isinstance(pythonType, basestring):
                    # resolve a "package.module.Class" string into the class object
                    pythonTypeTokenList = location.getPythonType().split('.')
                    importClassString = pythonTypeTokenList.pop()
                    importClassString = importClassString.strip()
                    importPackage = ".".join(pythonTypeTokenList)
                    importType = __import__(importPackage, globals(), locals(), [importClassString], 0)
                    pythonType = getattr(importType, importClassString)
            bypassFunc = getattr(location.mapper, "bypass_" + datasetType)
            callback = lambda: bypassFunc(datasetType, pythonType, location, dataId)
        else:
            callback = lambda: self._read(location)
        if location.mapper.canStandardize(datasetType):
            innerCallback = callback
            callback = lambda: location.mapper.standardize(datasetType, innerCallback(), dataId)
        if immediate:
            return callback()
        return ReadProxy(callback)
    def put(self, obj, datasetType, dataId={}, doBackup=False, **rest):
        """Persists a dataset given an output collection data id.

        @param obj the object to persist.
        @param datasetType (str) the type of dataset to persist.
        @param dataId (dict) the data id.
        @param doBackup (bool) if True, rename existing instead of overwriting.
        @param **rest keyword arguments for the data id.

        WARNING: Setting doBackup=True is not safe for parallel processing, as it
        may be subject to race conditions.
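
        For example (a sketch; the dataset type and dataId keys are hypothetical):

            butler.put(exposure, 'calexp', dataId={'visit': 1234, 'ccd': 5}, doBackup=True)
        """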
        dataId = DataId(dataId)
        dataId.update(**rest)

        for repoData in self._repos.outputs():
            location = repoData.repo.map(datasetType, dataId, write=True)
            if doBackup:
                repoData.repo.backup(datasetType, dataId)
            repoData.repo.write(location, obj)
    def subset(self, datasetType, level=None, dataId={}, **rest):
        """Extracts a subset of a dataset collection.

        Given a partial dataId specified in dataId and **rest, find all
        datasets at a given level specified by a dataId key (e.g. visit or
        sensor or amp for a camera) and return a collection of their dataIds
        as dataRefs.

        @param datasetType (str) the type of dataset collection to subset
        @param level (str) the level of dataId at which to subset. Use an empty string if the mapper
                           should look up the default level.
        @param dataId (dict) the data id.
        @param **rest keyword arguments for the data id.
        @returns (ButlerSubset) collection of ButlerDataRefs for datasets
                 matching the data id.
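
        For example (a sketch; the dataset type, level, and dataId keys are hypothetical):

            for dataRef in butler.subset('raw', level='ccd', dataId={'visit': 1234}):
                exposure = dataRef.get('raw')
        """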
        dataId = DataId(dataId)
        dataId.update(**rest)
        return ButlerSubset(self, datasetType, level, dataId)
    def dataRef(self, datasetType, level=None, dataId={}, **rest):
        """Returns a single ButlerDataRef.

        Given a complete dataId specified in dataId and **rest, find the
        unique dataset at the given level specified by a dataId key (e.g.
        visit or sensor or amp for a camera) and return a ButlerDataRef.

        @param datasetType (str) the type of dataset collection to reference
        @param level (str) the level of dataId at which to reference
        @param dataId (dict) the data id.
        @param **rest keyword arguments for the data id.
        @returns (ButlerDataRef) ButlerDataRef for dataset matching the data id
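
        For example (a sketch; the dataset type and dataId keys are hypothetical):

            ref = butler.dataRef('raw', dataId={'visit': 1234, 'ccd': 5})
            exposure = ref.get('raw')
        """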
        dataId = DataId(dataId)
        subset = self.subset(datasetType, level, dataId, **rest)
        if len(subset) != 1:
            raise RuntimeError("No unique dataset for: Dataset type:%s Level:%s Data ID:%s Keywords:%s" %
                               (str(datasetType), str(level), str(dataId), str(rest)))
        return ButlerDataRef(subset, subset.cache[0])
    def _read(self, location):
        self.log.debug("Starting read from %s", location)
        results = location.repository.read(location)
        if len(results) == 1:
            results = results[0]
        self.log.debug("Ending read from %s", location)
        return results
705 """ Replaces all the known alias keywords in the given string with the alias value.
706 @param (str)datasetType
707 @return (str) the de-aliased string
712 if datasetType.find(
'@') == -1:
717 if datasetType.find(
'@') != -1:
718 raise RuntimeError(
"Unresolvable alias specifier in datasetType: %s" % (datasetType))
    mapperArgs = initArgs.pop('mapperArgs')
    initArgs.update(mapperArgs)
    butler = Butler(**initArgs)
    butler.datasetTypeAliasDict = datasetTypeAliasDict