LSSTApplications  19.0.0-14-gb0260a2+72efe9b372,20.0.0+7927753e06,20.0.0+8829bf0056,20.0.0+995114c5d2,20.0.0+b6f4b2abd1,20.0.0+bddc4f4cbe,20.0.0-1-g253301a+8829bf0056,20.0.0-1-g2b7511a+0d71a2d77f,20.0.0-1-g5b95a8c+7461dd0434,20.0.0-12-g321c96ea+23efe4bbff,20.0.0-16-gfab17e72e+fdf35455f6,20.0.0-2-g0070d88+ba3ffc8f0b,20.0.0-2-g4dae9ad+ee58a624b3,20.0.0-2-g61b8584+5d3db074ba,20.0.0-2-gb780d76+d529cf1a41,20.0.0-2-ged6426c+226a441f5f,20.0.0-2-gf072044+8829bf0056,20.0.0-2-gf1f7952+ee58a624b3,20.0.0-20-geae50cf+e37fec0aee,20.0.0-25-g3dcad98+544a109665,20.0.0-25-g5eafb0f+ee58a624b3,20.0.0-27-g64178ef+f1f297b00a,20.0.0-3-g4cc78c6+e0676b0dc8,20.0.0-3-g8f21e14+4fd2c12c9a,20.0.0-3-gbd60e8c+187b78b4b8,20.0.0-3-gbecbe05+48431fa087,20.0.0-38-ge4adf513+a12e1f8e37,20.0.0-4-g97dc21a+544a109665,20.0.0-4-gb4befbc+087873070b,20.0.0-4-gf910f65+5d3db074ba,20.0.0-5-gdfe0fee+199202a608,20.0.0-5-gfbfe500+d529cf1a41,20.0.0-6-g64f541c+d529cf1a41,20.0.0-6-g9a5b7a1+a1cd37312e,20.0.0-68-ga3f3dda+5fca18c6a4,20.0.0-9-g4aef684+e18322736b,w.2020.45
LSSTDataManagementBasePackage
ingestDriver.py
Go to the documentation of this file.
1 from lsst.ctrl.pool.pool import Pool, startPool, abortOnError
2 from lsst.ctrl.pool.parallel import BatchCmdLineTask
3 from lsst.pipe.base import Struct
4 from lsst.pipe.tasks.ingest import IngestTask, IngestError
5 
6 
8  """Parallel version of IngestTask"""
@classmethod
def batchWallTime(cls, time, parsedCmd, numCores):
    """Return walltime request for batch job.

    Parameters
    ----------
    time : number or `str`
        Time value; it is converted with ``float`` and scaled by the
        number of files.
    parsedCmd : `argparse.Namespace`
        Parsed command line; only ``parsedCmd.files`` is read.
    numCores : `int`
        Number of cores the work is divided across.

    Returns
    -------
    walltime : `float`
        ``time`` multiplied by the number of files and divided by
        ``numCores``.
    """
    timeValue = float(time)
    numFiles = len(parsedCmd.files)
    return timeValue*numFiles/numCores
12 
@classmethod
def _makeArgumentParser(cls, *args, **kwargs):
    """Build an ArgumentParser

    The batch-specific keyword arguments ``doBatch`` and ``add_help``
    are discarded; everything else is forwarded to
    ``cls.ArgumentParser`` together with ``name="ingest"``.

    Parameters
    ----------
    *args
        Positional arguments passed through to ``cls.ArgumentParser``.
    **kwargs
        Keyword arguments passed through to ``cls.ArgumentParser``,
        minus ``doBatch`` and ``add_help``.

    Returns
    -------
    parser
        Whatever ``cls.ArgumentParser`` returns.
    """
    batchOnly = ("doBatch", "add_help")
    parserKwargs = {key: value for key, value in kwargs.items() if key not in batchOnly}
    return cls.ArgumentParser(*args, name="ingest", **parserKwargs)
22 
@classmethod
def parseAndRun(cls, *args, **kwargs):
    """Run with a MPI process pool

    Starts the process pool, parses the command line with a default
    configuration, constructs the task from the parsed configuration
    and runs it, then shuts the pool down.

    Parameters
    ----------
    *args, **kwargs
        Accepted for signature compatibility; the values passed in
        are not used.
    """
    pool = startPool()
    defaultConfig = cls.ConfigClass()
    argumentParser = cls.ArgumentParser(name=cls._DefaultName)
    parsedCmd = argumentParser.parse_args(defaultConfig)
    ingestTask = cls(config=parsedCmd.config)
    ingestTask.run(parsedCmd)
    pool.exit()
33 
def runFileWrapper(self, struct, args):
    """Ingest a single file, tolerating ingest failures.

    Thin wrapper around ``runFile``: an `IngestError` is logged as a
    warning and reported to the caller as ``None`` instead of being
    propagated.

    Parameters
    ----------
    struct : `lsst.pipe.base.Struct`
        Structure containing ``filename`` (`str`) and ``position`` (`int`).
    args : `argparse.Namespace`
        Parsed command-line arguments.

    Returns
    -------
    hduInfoList : `list` of `dict`
        Parsed information from FITS HDUs, or ``None``.
    """
    path, index = struct.filename, struct.position
    try:
        # No registry is handed to ``runFile`` here (second argument).
        hduInfoList = self.runFile(path, None, args, index)
    except IngestError as exc:
        self.log.warn(f"Unable to ingest {path}: {exc}")
        hduInfoList = None
    return hduInfoList
58 
@abortOnError
def run(self, args):
    """Run ingest

    The files are read and ingested in parallel through the process
    pool; afterwards the registry database is filled serially.

    Parameters
    ----------
    args : `argparse.Namespace`
        Parsed command-line arguments; ``files``, ``input``,
        ``create`` and ``dryrun`` are read here.
    """
    # Parallel: one work item per expanded filename, tagged with its index.
    pool = Pool(None)
    workItems = [
        Struct(filename=name, position=index)
        for index, name in enumerate(self.expandFiles(args.files))
    ]
    results = pool.map(self.runFileWrapper, workItems, args)

    # Serial: write every collected row into the registry.
    with self.register.openRegistry(args.input, create=args.create, dryrun=args.dryrun) as registry:
        for hduInfoList in results:
            # ``None`` marks a file whose ingest failed; nothing to add.
            if hduInfoList is not None:
                for info in hduInfoList:
                    self.register.addRow(registry, info, dryrun=args.dryrun, create=args.create)
81 
def writeConfig(self, *args, **kwargs):
    """Do nothing; all arguments are accepted and ignored.

    NOTE(review): presumably this disables configuration persistence
    inherited from a base class -- confirm against the parent task.
    """
84 
def writeMetadata(self, *args, **kwargs):
    """Do nothing; all arguments are accepted and ignored.

    NOTE(review): presumably this disables metadata persistence
    inherited from a base class -- confirm against the parent task.
    """
lsst::log.log.logContinued.warn
def warn(fmt, *args)
Definition: logContinued.py:205
lsst.pipe.drivers.ingestDriver.PoolIngestTask
Definition: ingestDriver.py:7
lsst.pipe.tasks.ingest.IngestTask.expandFiles
def expandFiles(self, fileNameList)
Expand a set of filenames and globs, returning a list of filenames.
Definition: ingest.py:537
lsst.pipe.tasks.ingest.IngestTask._DefaultName
_DefaultName
Definition: ingest.py:390
lsst.pipe.tasks.ingest.IngestTask
Definition: ingest.py:386
lsst.ctrl.pool.parallel
Definition: parallel.py:1
lsst::afw::geom.transform.transformContinued.cls
cls
Definition: transformContinued.py:33
lsst.pipe.drivers.ingestDriver.PoolIngestTask.writeConfig
def writeConfig(self, *args, **kwargs)
Definition: ingestDriver.py:82
lsst.ctrl.pool.pool.startPool
def startPool(comm=None, root=0, killSlaves=True)
Start a process pool.
Definition: pool.py:1216
lsst.pipe.drivers.ingestDriver.PoolIngestTask.batchWallTime
def batchWallTime(cls, time, parsedCmd, numCores)
Return walltime request for batch job.
Definition: ingestDriver.py:10
lsst.pipe.tasks.ingest.IngestTask.runFile
def runFile(self, infile, registry, args, pos)
Examine and ingest a single file.
Definition: ingest.py:556
lsst.pipe.drivers.ingestDriver.PoolIngestTask.writeMetadata
def writeMetadata(self, *args, **kwargs)
Definition: ingestDriver.py:85
lsst.pipe.tasks.ingest
Definition: ingest.py:1
lsst.pipe.base.struct.Struct
Definition: struct.py:26
lsst.pipe.base.task.Task.log
log
Definition: task.py:161
lsst.pipe.tasks.ingest.IngestTask.ArgumentParser
ArgumentParser
Definition: ingest.py:389
lsst.ctrl.pool.parallel.BatchCmdLineTask
Definition: parallel.py:432
lsst.pipe.drivers.ingestDriver.PoolIngestTask.parseAndRun
def parseAndRun(cls, *args, **kwargs)
Definition: ingestDriver.py:24
lsst.ctrl.pool.pool
Definition: pool.py:1
lsst.ctrl.pool.pool.Pool
Definition: pool.py:1205
lsst.pipe.drivers.ingestDriver.PoolIngestTask.run
def run(self, args)
Definition: ingestDriver.py:60
lsst.pipe.drivers.ingestDriver.PoolIngestTask.runFileWrapper
def runFileWrapper(self, struct, args)
Definition: ingestDriver.py:34
lsst.pipe.base
Definition: __init__.py:1
lsst.pipe.tasks.ingest.IngestTask.ConfigClass
ConfigClass
Definition: ingest.py:388