LSSTApplications  1.1.2+25,10.0+13,10.0+132,10.0+133,10.0+224,10.0+41,10.0+8,10.0-1-g0f53050+14,10.0-1-g4b7b172+19,10.0-1-g61a5bae+98,10.0-1-g7408a83+3,10.0-1-gc1e0f5a+19,10.0-1-gdb4482e+14,10.0-11-g3947115+2,10.0-12-g8719d8b+2,10.0-15-ga3f480f+1,10.0-2-g4f67435,10.0-2-gcb4bc6c+26,10.0-28-gf7f57a9+1,10.0-3-g1bbe32c+14,10.0-3-g5b46d21,10.0-4-g027f45f+5,10.0-4-g86f66b5+2,10.0-4-gc4fccf3+24,10.0-40-g4349866+2,10.0-5-g766159b,10.0-5-gca2295e+25,10.0-6-g462a451+1
LSSTDataManagementBasePackage
Classes | Functions | Variables
lsst.datarel.schema Namespace Reference

Classes

class  DbMappingConfig
 

Functions

def _pk
 
def _k
 
def makeMysqlCsvConfig
 
def genericTableSql
 
def _sourceIndexes
 
def _colToField
 
def _getMappingKw
 
def sourceTableSql
 
def objectTableSql
 
def coaddSourceTableSql
 
def forcedSourceTableSql
 

Variables

list __all__
 
dictionary _dbType
 
list _sourceMappings
 
list _objectMappings
 
list _filterMappings
 
list _coaddSourceMappings
 
list _forcedSourceMappings
 

Function Documentation

def lsst.datarel.schema._colToField (   col)
private
Turn a database column name back into a C++ table field name

Definition at line 316 of file schema.py.

317 def _colToField(col):
318  """Turn a database column name back into a C++ table field name"""
319  i = col.rfind('_')
320  if i == -1:
321  return col
322  field = col[:i].replace('_', '.')
323  suffix = col[i+1:]
324  if suffix in ['x', 'y', 'Ixx', 'Iyy', 'Ixy', 'ra', 'decl']:
325  return field
326  if suffix.endswith('Var') or suffix.endswith('Cov'):
327  return field + '.err'
328  # TODO: generic Cov<T> or Array<T> fields not supported yet,
329  # but so far no such fields are mapped to canonical
330  # Source/Object table columns.
331  return col.replace('_', '.')
def lsst.datarel.schema._getMappingKw (   slots,
  sourceProcessingConfig,
  measPrefix = None 
)
private
Return substitution parameters for mapping table entries.

Definition at line 332 of file schema.py.

333 def _getMappingKw(slots, sourceProcessingConfig, measPrefix=None):
334  """Return substitution parameters for mapping table entries.
335  """
336  kw = dict()
337  kw['measPrefix'] = (measPrefix or '').replace('.', '_')
338  kw['exposurePrefix'] = sourceProcessingConfig.exposurePrefix.replace('.', '_')
339  kw['clusterPrefix'] = sourceProcessingConfig.clusterPrefix.replace('.', '_')
340  kw['centroid'] = slots.centroid.replace('.', '_') if slots.centroid else '__X__'
341  kw['shape'] = slots.shape.replace('.', '_') if slots.shape else '__X__'
342  kw['psfFlux'] = slots.psfFlux.replace('.', '_') if slots.psfFlux else '__X__'
343  kw['apFlux'] = slots.apFlux.replace('.', '_') if slots.apFlux else '__X__'
344  kw['modelFlux'] = slots.modelFlux.replace('.', '_') if slots.modelFlux else '__X__'
345  kw['instFlux'] = slots.instFlux.replace('.', '_') if slots.instFlux else '__X__'
346  return kw
def lsst.datarel.schema._k (   cols)
private

Definition at line 51 of file schema.py.

51 
52 def _k(cols):
53  if not isinstance(cols, basestring):
54  idx = '_'.join(cols)
55  cols = ', '.join(cols)
56  else:
57  idx = cols
58  return str.format('KEY IDX_{0} ({0})', idx, cols)
59 
def lsst.datarel.schema._pk (   cols)
private

Definition at line 46 of file schema.py.

46 
47 def _pk(cols):
48  if not isinstance(cols, basestring):
49  cols = ', '.join(colName)
50  return str.format('PRIMARY KEY ({0})', cols)
def lsst.datarel.schema._sourceIndexes (   sourceProcessingConfig)
private
Return the list of C++ Source field names to create indexes on.

@param sourceProcessingConfig     lsst.ap.cluster.SourceProcessingConfig;
                                  describes source processing performed by
                                  SourceAssoc.

Definition at line 236 of file schema.py.

237 def _sourceIndexes(sourceProcessingConfig):
238  """Return the list of C++ Source field names to create indexes on.
239 
240  @param sourceProcessingConfig lsst.ap.cluster.SourceProcessingConfig;
241  describes source processing performed by
242  SourceAssoc.
243  """
244  indexes = set()
245  indexes.add("parent")
246  if sourceProcessingConfig.exposurePrefix:
247  indexes.add(sourceProcessingConfig.exposurePrefix + ".id")
248  if not sourceProcessingConfig.multiBand:
249  indexes.add(sourceProcessingConfig.exposurePrefix + ".filter.id")
250  if sourceProcessingConfig.clusterPrefix:
251  indexes.add(sourceProcessingConfig.clusterPrefix + ".id")
252  return indexes
253 
254 
# mappings from run-specific table column names to canonical Source columns
def lsst.datarel.schema.coaddSourceTableSql (   coaddName,
  schema,
  sourceConversionConfig,
  asView,
  sourceProcessingConfig,
  slotConfig,
  measPrefix 
)
Return a tuple of SQL statements (createStmt, loadStmt, sourceStmt)
for a coadd source table. The canonical table name is obtained by
capitalizing the first letter of coaddName and appending 'Source'. The
run specific table name is derived from the former by prepending 'Run'.

createStmt :    CREATE TABLE statement for the Run<CoaddName>Source table,
                which includes all fields from the run-specific
                lsst.afw.table.Schema for source tables output by the
                pipelines.

loadStmt :      LOAD DATA statement for the Run<CoaddName>Source table.
                This is a format string; to generate valid SQL a fileName
                must be supplied, e.g.:

                loadStmt.format(fileName='source.csv')

sourceStmt :    Map the Run<CoaddName>Source table to the canonical
                <CoaddName>Source schema. This will either create a VIEW,
                or INSERT into the materialized equivalent.

@param coaddName
    Coadd name (camel-case), e.g. 'deep' or 'goodSeeing'.
@param schema
    lsst.afw.table.Schema for coadd-sources.   
@param sourceConversionConfig
    lsst.ap.utils.CsvConversionConfig - parameters used for
    C++ to CSV conversion.
@param asView
    True if the canonical table should be constructed as a VIEW on
    top of the run-specific table.
@param sourceProcessingConfig
    lsst.ap.cluster.SourceProcessingConfig - parameters used to
    denormalize the C++ schema produced by the pipeline.
@param slotConfig
    lsst.meas.algorithms.SlotConfig - pipeline slot mappings.
@param measPrefix
    Prefix for measurement field names.

Definition at line 630 of file schema.py.

def coaddSourceTableSql(coaddName, schema, sourceConversionConfig, asView,
                        sourceProcessingConfig, slotConfig, measPrefix):
    """Return a tuple of SQL statements (createStmt, loadStmt, sourceStmt)
    for a coadd source table. The canonical table name is obtained by
    capitalizing the first letter of coaddName and appending 'Source'. The
    run specific table name is derived from the former by prepending 'Run'.

    createStmt :  CREATE TABLE statement for the Run<CoaddName>Source table,
                  which includes all fields from the run-specific
                  lsst.afw.table.Schema for source tables output by the
                  pipelines.

    loadStmt :    LOAD DATA statement for the Run<CoaddName>Source table.
                  This is a format string; to generate valid SQL a fileName
                  must be supplied, e.g.:

                  loadStmt.format(fileName='source.csv')

    sourceStmt :  Map the Run<CoaddName>Source table to the canonical
                  <CoaddName>Source schema. This will either create a VIEW,
                  or INSERT into the materialized equivalent.

    @param coaddName
        Coadd name (camel-case), e.g. 'deep' or 'goodSeeing'.
    @param schema
        lsst.afw.table.Schema for coadd-sources.
    @param sourceConversionConfig
        lsst.ap.utils.CsvConversionConfig - parameters used for
        C++ to CSV conversion.
    @param asView
        True if the canonical table should be constructed as a VIEW on
        top of the run-specific table.
    @param sourceProcessingConfig
        lsst.ap.cluster.SourceProcessingConfig - parameters used to
        denormalize the C++ schema produced by the pipeline.
    @param slotConfig
        lsst.meas.algorithms.SlotConfig - pipeline slot mappings.
    @param measPrefix
        Prefix for measurement field names.
    """
    # Generate SQL for run specific table
    createStmt, loadStmt = genericTableSql(
        schema,
        sourceConversionConfig,
        _sourceIndexes(sourceProcessingConfig))
    # build substitution parameters for mapping table
    kw = _getMappingKw(
        slotConfig,
        sourceProcessingConfig,
        measPrefix)
    # build selection/output column lists
    selcols = []
    outcols = []
    CoaddName = coaddName[0].upper() + coaddName[1:]
    for runFmt, srcCol in _coaddSourceMappings:
        # Resolve run-specific and canonical column names for this entry.
        runCol = runFmt.format(**kw)
        srcCol = srcCol.format(coaddName=coaddName, CoaddName=CoaddName)
        if sourceProcessingConfig.multiBand and srcCol == 'filterId':
            continue # multi-band source has no filterId
        field = _colToField(runCol)
        isFlag = srcCol.startswith('flag')
        if isFlag and not sourceConversionConfig.flagsAsBits:
            # Individual flag columns do not exist; flags are handled
            # below as packed BIGINTs.
            continue
        if field in schema or runCol == 'coord_htmId20':
            # coord_htmId20 is computed at load time and therefore never
            # appears in the afw schema; always select it.
            selcols.append(runCol)
        elif isFlag:
            # Canonical flag with no run-specific counterpart: constant 0.
            selcols.append("b'0'")
        else:
            selcols.append('NULL')
        outcols.append(srcCol)
    if not sourceConversionConfig.flagsAsBits:
        # Deal with canonical flags packed into BIGINTs
        # (63 flags per column; relies on Python 2 integer division).
        n = (len(sourceConversionConfig.canonicalFlags) + 62) / 63
        if n == 1:
            selcols.append('flags')
            outcols.append('flags')
        else:
            for i in xrange(1, n + 1):
                c = 'flags{}'.format(i)
                selcols.append(c)
                outcols.append(c)
    tableName = CoaddName + 'Source'
    runTableName = 'Run' + tableName
    if asView:
        # Replace the official version of <CoaddName>Source with an equivalent VIEW
        sourceStmt = 'CREATE OR REPLACE VIEW {} AS SELECT\n\t'.format(tableName)
        sourceStmt += ',\n\t'.join(a + ' AS ' + b for a,b in zip(selcols, outcols))
        sourceStmt += '\nFROM {};'.format(runTableName)
    else:
        # Use the definition of Source from cat (i.e. the one used by the
        # schema browser for documentation purposes). This should cause
        # ingest to fail if this code and the canonical schema are not in sync.
        sourceStmt = 'INSERT INTO {} (\n\t'.format(tableName)
        sourceStmt += ',\n\t'.join(outcols)
        sourceStmt += ')\nSELECT\n\t'
        sourceStmt += ',\n\t'.join(selcols)
        sourceStmt += '\nFROM {};\n'.format(runTableName)
    return (createStmt.format(tableName=runTableName),
            loadStmt.format(tableName=runTableName, fileName='{fileName}'),
            sourceStmt)
730 
# mappings from run-specific table column names to canonical ForcedSource columns
def lsst.datarel.schema.forcedSourceTableSql (   coaddName,
  schema,
  sourceConversionConfig,
  asView,
  sourceProcessingConfig,
  slotConfig,
  measPrefix 
)
Return a tuple of SQL statements (createStmt, loadStmt, sourceStmt)
for a forced source table. The canonical table name is obtained by
capitalizing the first letter of coaddName and appending 'ForcedSource'.
The run specific table name is derived from the former by prepending 'Run'.

createStmt :    CREATE TABLE statement for the Run<CoaddName>ForcedSource
                table, which includes all fields from the run-specific
                lsst.afw.table.Schema for source tables output by the
                pipelines.

loadStmt :      LOAD DATA statement for the Run<CoaddName>ForcedSource
                table.  This is a format string; to generate valid SQL a
                fileName must be supplied, e.g.:

                loadStmt.format(fileName='source.csv')

sourceStmt :    Map the Run<CoaddName>ForcedSource table to the canonical
                <CoaddName>ForcedSource schema. This will either create a
                VIEW, or INSERT into the materialized equivalent.

@param coaddName
    Coadd name (camel-case), e.g. 'deep' or 'goodSeeing'.
@param schema
    lsst.afw.table.Schema for forced sources.   
@param sourceConversionConfig
    lsst.ap.utils.CsvConversionConfig - parameters used for
    C++ to CSV conversion.
@param asView
    True if the canonical table should be constructed as a VIEW on
    top of the run-specific table.
@param sourceProcessingConfig
    lsst.ap.cluster.SourceProcessingConfig - parameters used to
    denormalize the C++ schema produced by the pipeline.
@param slotConfig
    lsst.meas.algorithms.SlotConfig - pipeline slot mappings.
@param measPrefix
    Prefix for measurement field names.

Definition at line 795 of file schema.py.

def forcedSourceTableSql(coaddName, schema, sourceConversionConfig, asView,
                         sourceProcessingConfig, slotConfig, measPrefix):
    """Return a tuple of SQL statements (createStmt, loadStmt, sourceStmt)
    for a forced source table. The canonical table name is obtained by
    capitalizing the first letter of coaddName and appending 'ForcedSource'.
    The run specific table name is derived from the former by prepending 'Run'.

    createStmt :  CREATE TABLE statement for the Run<CoaddName>ForcedSource
                  table, which includes all fields from the run-specific
                  lsst.afw.table.Schema for source tables output by the
                  pipelines.

    loadStmt :    LOAD DATA statement for the Run<CoaddName>ForcedSource
                  table.  This is a format string; to generate valid SQL a
                  fileName must be supplied, e.g.:

                  loadStmt.format(fileName='source.csv')

    sourceStmt :  Map the Run<CoaddName>ForcedSource table to the canonical
                  <CoaddName>ForcedSource schema. This will either create a
                  VIEW, or INSERT into the materialized equivalent.

    @param coaddName
        Coadd name (camel-case), e.g. 'deep' or 'goodSeeing'.
    @param schema
        lsst.afw.table.Schema for forced sources.
    @param sourceConversionConfig
        lsst.ap.utils.CsvConversionConfig - parameters used for
        C++ to CSV conversion.
    @param asView
        True if the canonical table should be constructed as a VIEW on
        top of the run-specific table.
    @param sourceProcessingConfig
        lsst.ap.cluster.SourceProcessingConfig - parameters used to
        denormalize the C++ schema produced by the pipeline.
    @param slotConfig
        lsst.meas.algorithms.SlotConfig - pipeline slot mappings.
    @param measPrefix
        Prefix for measurement field names.
    """
    # Generate SQL for run specific table
    createStmt, loadStmt = genericTableSql(
        schema,
        sourceConversionConfig,
        _sourceIndexes(sourceProcessingConfig))
    # build substitution parameters for mapping table
    if sourceProcessingConfig.clusterPrefix is None:
        # NOTE(review): this mutates the caller's config object in place —
        # presumably harmless here, but worth confirming against callers.
        sourceProcessingConfig.clusterPrefix = ""
    kw = _getMappingKw(
        slotConfig,
        sourceProcessingConfig,
        measPrefix)
    # build selection/output column lists
    selcols = []
    outcols = []
    CoaddName = coaddName[0].upper() + coaddName[1:]
    for runFmt, srcCol in _forcedSourceMappings:
        # Resolve run-specific and canonical column names for this entry.
        runCol = runFmt.format(**kw)
        srcCol = srcCol.format(coaddName=coaddName, CoaddName=CoaddName)
        if sourceProcessingConfig.multiBand and srcCol == 'filterId':
            continue # multi-band source has no filterId
        field = _colToField(runCol)
        isFlag = srcCol.startswith('flag')
        if isFlag and not sourceConversionConfig.flagsAsBits:
            # Individual flag columns do not exist; flags are handled
            # below as packed BIGINTs.
            continue
        if field in schema or runCol == 'coord_htmId20':
            # coord_htmId20 is computed at load time and therefore never
            # appears in the afw schema; always select it.
            selcols.append(runCol)
        elif isFlag:
            # Canonical flag with no run-specific counterpart: constant 0.
            selcols.append("b'0'")
        else:
            selcols.append('NULL')
        outcols.append(srcCol)
    if not sourceConversionConfig.flagsAsBits:
        # Deal with canonical flags packed into BIGINTs
        # (63 flags per column; relies on Python 2 integer division).
        n = (len(sourceConversionConfig.canonicalFlags) + 62) / 63
        if n == 1:
            selcols.append('flags')
            outcols.append('flags')
        else:
            for i in xrange(1, n + 1):
                c = 'flags{}'.format(i)
                selcols.append(c)
                outcols.append(c)
    tableName = CoaddName + 'ForcedSource'
    runTableName = 'Run' + tableName
    if asView:
        # Replace the official version of <CoaddName>ForcedSource with an equivalent VIEW
        sourceStmt = 'CREATE OR REPLACE VIEW {} AS SELECT\n\t'.format(tableName)
        sourceStmt += ',\n\t'.join(a + ' AS ' + b for a,b in zip(selcols, outcols))
        sourceStmt += '\nFROM {};'.format(runTableName)
    else:
        # Use the definition of Source from cat (i.e. the one used by the
        # schema browser for documentation purposes). This should cause
        # ingest to fail if this code and the canonical schema are not in sync.
        sourceStmt = 'INSERT INTO {} (\n\t'.format(tableName)
        sourceStmt += ',\n\t'.join(outcols)
        sourceStmt += ')\nSELECT\n\t'
        sourceStmt += ',\n\t'.join(selcols)
        sourceStmt += '\nFROM {};\n'.format(runTableName)
    return (createStmt.format(tableName=runTableName),
            loadStmt.format(tableName=runTableName, fileName='{fileName}'),
            sourceStmt)
def lsst.datarel.schema.genericTableSql (   schema,
  csvConversionConfig,
  indexedFields 
)
Return a pair of SQL template strings (createStmt, loadStmt).

createStmt : a format string for the CREATE TABLE statement corresponding
             to the given schema and desired indexes. To generate valid
             SQL, tableName must be supplied, e.g.:

             str.format(create, tableName='MyTable')

loadStmt   : a format string for the corresponding LOAD DATA statement.
             To generate valid SQL, tableName and fileName must be supplied,
             e.g.:

             str.format(load, tableName='MyTable', fileName='MyTable.csv')

Note that the generated LOAD statement will never REPLACE data, and assumes
that CSV files conform to the format returned by makeMysqlCsvConfig().

@param schema               lsst.afw.table.Schema describing the C++ table
                            to map to a MySQL database table.
@param csvConversionConfig  lsst.ap.utils.CsvConversionConfig describing
                            the C++ table to CSV file conversion options. 
@param indexedFields        List or set of C++ field names to create indexes on

Definition at line 91 of file schema.py.

91 
def genericTableSql(schema, csvConversionConfig, indexedFields):
    """Return a pair of SQL template strings (createStmt, loadStmt).

    createStmt : a format string for the CREATE TABLE statement corresponding
                 to the given schema and desired indexes. To generate valid
                 SQL, tableName must be supplied, e.g.:

                 str.format(create, tableName='MyTable')

    loadStmt   : a format string for the corresponding LOAD DATA statement.
                 To generate valid SQL, tableName and fileName must be supplied,
                 e.g.:

                 str.format(load, tableName='MyTable', fileName='MyTable.csv')

    Note that the generated LOAD statement will never REPLACE data, and assumes
    that CSV files conform to the format returned by makeMysqlCsvConfig().

    @param schema               lsst.afw.table.Schema describing the C++ table
                                to map to a MySQL database table.
    @param csvConversionConfig  lsst.ap.utils.CsvConversionConfig describing
                                the C++ table to CSV file conversion options.
    @param indexedFields        List or set of C++ field names to create indexes on
    """
    dbkeys = []    # KEY / PRIMARY KEY clauses for CREATE TABLE
    coldefs = []   # column definitions for CREATE TABLE
    columns = []   # column (or @variable) list for LOAD DATA
    setexprs = []  # SET expressions for LOAD DATA

    def _append(dbcol, dbty, suffixes):
        # Emit one nullable column of type dbty per suffix.
        for suffix in suffixes:
            coldefs.append(str.format('{}{} {} NULL', dbcol, suffix, dbty))
            columns.append(dbcol + suffix)

    for item in schema.asList():
        name = item.field.getName()
        #replace all non-word characters with underscore
        dbcol = re.sub('[\W]','_',name)
        ty = item.key.getTypeString()
        if ty in _dbType:
            # Scalar field types map directly to a single database column.
            dbty = _dbType[ty]
            constraint = 'NULL'
            if name == 'id':
                # The unique identifier becomes the primary key.
                dbkeys.append(_pk(dbcol))
                constraint = 'NOT NULL'
            elif ty == 'Flag':
                if not csvConversionConfig.flagsAsBits:
                    continue # we will deal with flags later
                constraint = 'NOT NULL'
            elif ty == 'I' or ty == 'L':
                # Integer columns are NOT NULL unless explicitly nullable.
                if name in csvConversionConfig.nullableIntegers:
                    constraint = 'NULL'
                else:
                    constraint = 'NOT NULL'
            else:
                constraint = 'NULL'
            coldefs.append(' '.join([dbcol, dbty, constraint]))
            if ty == 'Flag':
                # Flags are loaded via a user variable and CAST so the 0/1
                # text value lands in a BIT-typed column correctly.
                columns.append('@' + dbcol)
                setexprs.append(str.format('{0} = CAST(@{0} AS UNSIGNED)', dbcol))
            else:
                columns.append(dbcol)
            if name != 'id' and name in indexedFields:
                dbkeys.append(_k(dbcol))
        elif ty == 'Coord':
            if name == "coord":
                # the Coord slot field; also derive an HTM ID 20 column for
                # spatial indexing, computed at load time via scisql.
                coldefs.append('coord_ra DOUBLE NULL')
                coldefs.append('coord_decl DOUBLE NULL')
                coldefs.append('coord_htmId20 BIGINT NULL')
                columns.append('coord_ra')
                columns.append('coord_decl')
                setexprs.append('coord_htmId20 = scisql_s2HtmId(coord_ra, coord_decl, 20)')
                dbkeys.append(_k('coord_htmId20'))
                dbkeys.append(_k('coord_decl'))
            else:
                _append(dbcol, 'DOUBLE', ['_ra', '_decl'])
        elif ty == 'ArrayF' or ty == 'ArrayD':
            # Fixed-size arrays expand to one column per element (1-based).
            dbty = _dbType[ty[-1]]
            for i in xrange(1, item.key.getSize() + 1):
                coldefs.append(str.format('{}_{} {} NULL', dbcol, i, dbty))
                columns.append(str.format('{}_{}', dbcol, i))
        elif ty == 'PointI' or ty == 'PointF' or ty == 'PointD':
            dbty = _dbType[ty[-1]]
            _append(dbcol, dbty, ['_x', '_y'])
        elif ty == 'MomentsF' or ty == 'MomentsD':
            dbty = _dbType[ty[-1]]
            _append(dbcol, dbty, ['_Ixx', '_Iyy', '_Ixy'])
        elif ty == 'CovF' or ty == 'CovD':
            # Covariance matrices are symmetric: store the upper triangle only.
            dbty = _dbType[ty[-1]]
            sz = item.key.getSize()
            for i in xrange(1, sz + 1):
                for j in xrange(i, sz + 1):
                    coldefs.append(str.format('{}_{}_{} {} NULL', dbcol, i, j, dbty))
                    columns.append(str.format('{}_{}_{}', dbcol, i, j))
        elif ty == 'CovPointF' or ty == 'CovPointD':
            dbty = _dbType[ty[-1]]
            if name.endswith('.err'):
                # Drop the '.err' suffix; the *Var/*Cov suffixes imply it.
                dbcol = dbcol[:-4]
            if item.field.getUnits() == 'rad^2':
                # HACK: this is a coordinate covariance matrix
                _append(dbcol, dbty, ['_raVar', '_radeclCov',
                                      '_declVar'])
                continue
            _append(dbcol, dbty, ['_xVar', '_xyCov',
                                  '_yVar'])
        elif ty == 'CovMomentsF' or ty == 'CovMomentsD':
            dbty = _dbType[ty[-1]]
            if name.endswith('.err'):
                dbcol = dbcol[:-4]
            _append(dbcol, dbty, ['_IxxVar', '_IxxIyyCov', '_IxxIxyCov',
                                  '_IyyVar', '_IyyIxyCov',
                                  '_IxyVar'])
        else:
            raise RuntimeError(ty + ' is not a recognized AFW field type string!')
    if not csvConversionConfig.flagsAsBits:
        # add BIGINT flag columns
        # (63 flags per column; relies on Python 2 integer division)
        n = (schema.getFlagFieldCount() + 62) / 63
        for i in xrange(1, n + 1):
            coldefs.append(str.format('runFlags{} BIGINT NOT NULL', i))
            columns.append(str.format('runFlags{}', i))
        # add BIGINT flag columns for canonical flags in canonical order
        n = (len(csvConversionConfig.canonicalFlags) + 62) / 63
        for i in xrange(1, n + 1):
            coldefs.append(str.format('flags{} BIGINT NOT NULL', i))
            columns.append(str.format('flags{}', i))
    # Finally, create schema SQL and LOAD DATA templates
    createStmt = 'CREATE TABLE IF NOT EXISTS {tableName} (\n\t'
    createStmt += ',\n\t'.join(coldefs + dbkeys)
    createStmt += '\n) ENGINE=MyISAM;\n'

    loadStmt = ("LOAD DATA LOCAL INFILE '{fileName}'\n"
                "\tINTO TABLE {tableName}\n"
                "\tFIELDS TERMINATED BY ','\n"
                "(\n\t")
    loadStmt += ',\n\t'.join(columns)
    if len(setexprs) == 0:
        loadStmt += '\n);'
    else:
        loadStmt += '\n) SET\n\t'
        loadStmt += ',\n\t'.join(setexprs)
        loadStmt += ';'
    return createStmt, loadStmt
235 
def lsst.datarel.schema.makeMysqlCsvConfig ( )
Return the lsst.ap.utils.CsvConfig to use when writing out CSV files
that must be loaded into MySQL.

Definition at line 60 of file schema.py.

60 
def makeMysqlCsvConfig():
    """Return the lsst.ap.utils.CsvConfig to use when writing out CSV files
    that must be loaded into MySQL.
    """
    cfg = lsst.ap.utils.CsvConfig()
    # Apply the MySQL-friendly options in a fixed order. Quoting is
    # disabled because C++ tables cannot contain strings (yet).
    for option, value in [
        ('quoting', 'QUOTE_NONE'),
        ('delimiter', ','),
        ('escapeChar', '\\'),
        ('quoteChar', ''),
        ('skipInitialSpace', False),
        ('doubleQuote', False),
        ('standardEscapes', True),
        ('trailingDelimiter', False),
        ('nonfiniteAsNull', True),
    ]:
        setattr(cfg, option, value)
    return cfg
76 
def makeMysqlCsvConfig
Definition: schema.py:60
def lsst.datarel.schema.objectTableSql (   schema,
  dbMappingConfig,
  sourceAssocConfig,
  filters 
)
Return a tuple of SQL statements (createStmt, loadStmt, objectStmt)
for the Object table.

createStmt :    CREATE TABLE statement for the RunObject table, which
                includes all fields from the run-specific
                lsst.afw.table.Schema for source cluster tables output
                by the SourceAssoc pipeline.

loadStmt :      LOAD DATA statement for the RunObject table. This is
                a format string; to generate valid SQL a fileName must
                be supplied, e.g.:

                loadStmt.format(fileName='object.csv')

objectStmt :    Map the RunObject table to the canonical Object schema.
                This will either create a VIEW, or INSERT into its
                materialized equivalent.

@param schema               lsst.afw.table.Schema for objects (source clusters)
@param dbMappingConfig      lsst.datarel.DbMappingConfig
@param sourceAssocConfig    lsst.ap.tasks.sourceAssoc.SourceAssocConfig
@param filters              Iterable over the filter names included in the
                            canonical Object table.

Definition at line 473 of file schema.py.

def objectTableSql(schema, dbMappingConfig, sourceAssocConfig, filters):
    """Return a tuple of SQL statements (createStmt, loadStmt, objectStmt)
    for the Object table.

    createStmt :  CREATE TABLE statement for the RunObject table, which
                  includes all fields from the run-specific
                  lsst.afw.table.Schema for source cluster tables output
                  by the SourceAssoc pipeline.

    loadStmt :    LOAD DATA statement for the RunObject table. This is
                  a format string; to generate valid SQL a fileName must
                  be supplied, e.g.:

                  loadStmt.format(fileName='object.csv')

    objectStmt :  Map the RunObject table to the canonical Object schema.
                  This will either create a VIEW, or INSERT into its
                  materialized equivalent.

    @param schema             lsst.afw.table.Schema for objects (source clusters)
    @param dbMappingConfig    lsst.datarel.DbMappingConfig
    @param sourceAssocConfig  lsst.ap.tasks.sourceAssoc.SourceAssocConfig
    @param filters            Iterable over the filter names included in the
                              canonical Object table.
    """
    # Generate SQL for run specific table (no extra indexes requested).
    createStmt, loadStmt = genericTableSql(
        schema, dbMappingConfig.objectConversion, set())
    # build substitution parameters for mapping table
    kw = _getMappingKw(
        sourceAssocConfig.measSlots,
        sourceAssocConfig.sourceProcessing,
        sourceAssocConfig.measPrefix)
    # build selection/output column lists
    selcols = []
    outcols = []
    # Filter-independent Object columns.
    for runFmt, objCol in _objectMappings:
        runCol = runFmt.format(**kw)
        field = _colToField(runCol)
        isFlag = objCol.startswith('flag')
        if isFlag and not dbMappingConfig.objectConversion.flagsAsBits:
            # Flags are handled below as packed BIGINTs.
            continue
        if field in schema or runCol == 'coord_htmId20':
            # coord_htmId20 is computed at load time and never appears
            # in the afw schema; always select it.
            selcols.append(runCol)
        elif isFlag:
            # Canonical flag with no run-specific counterpart: constant 0.
            selcols.append("b'0'")
        else:
            selcols.append('NULL')
        outcols.append(objCol)
    # Per-filter Object columns (one group per filter name).
    # NOTE(review): the loop variable shadows the builtin filter().
    for filter in filters:
        kw['filter'] = filter
        for runFmt, objFmt in _filterMappings:
            runCol = runFmt.format(**kw)
            objCol = objFmt.format(filter=filter)
            field = _colToField(runCol)
            isFlag = objCol.startswith('flag')
            if isFlag and not dbMappingConfig.objectConversion.flagsAsBits:
                continue
            if field in schema:
                selcols.append(runCol)
            elif isFlag:
                selcols.append("b'0'")
            else:
                selcols.append('NULL')
            outcols.append(objCol)
    if not dbMappingConfig.objectConversion.flagsAsBits:
        # Deal with canonical flags packed into BIGINTs
        # (63 flags per column; relies on Python 2 integer division).
        n = (len(dbMappingConfig.objectConversion.canonicalFlags) + 62) / 63
        if n == 1:
            selcols.append('flags')
            outcols.append('flags')
        else:
            for i in xrange(1, n + 1):
                c = 'flags{}'.format(i)
                selcols.append(c)
                outcols.append(c)
    if dbMappingConfig.asView:
        # Replace the official version of Object with an equivalent VIEW
        objectStmt = 'CREATE OR REPLACE VIEW Object AS SELECT\n\t'
        objectStmt += ',\n\t'.join(a + ' AS ' + b for a,b in zip(selcols, outcols))
        objectStmt += '\nFROM RunObject;'
    else:
        # Use the definition of Object from cat (i.e. the one used by the
        # schema browser for documentation purposes). This should cause
        # ingest to fail if this code and the canonical schema are not in sync.
        objectStmt = 'INSERT INTO Object (\n\t'
        objectStmt += ',\n\t'.join(outcols)
        objectStmt += ')\nSELECT\n\t'
        objectStmt += ',\n\t'.join(selcols)
        objectStmt += '\nFROM RunObject;'
    return (createStmt.format(tableName='RunObject'),
            loadStmt.format(tableName='RunObject', fileName='{fileName}'),
            objectStmt)
567 
def lsst.datarel.schema.sourceTableSql (   schema,
  dbMappingConfig,
  sourceAssocConfig 
)
Return a tuple of SQL statements (createStmt, loadStmt, sourceStmt)
for the Source table.

createStmt :    CREATE TABLE statement for the RunSource table, which
                includes all fields from the run-specific
                lsst.afw.table.Schema for source tables output by the
                pipelines.

loadStmt :      LOAD DATA statement for the RunSource table. This is
                a format string; to generate valid SQL a fileName must
                be supplied, e.g.:

                loadStmt.format(fileName='source.csv')

sourceStmt :    Map the RunSource table to the canonical Source schema.
                This will either create a VIEW, or INSERT into the
                materialized equivalent.

@param schema               lsst.afw.table.Schema for sources
@param dbMappingConfig      lsst.datarel.DbMappingConfig
@param sourceAssocConfig    lsst.ap.tasks.sourceAssoc.SourceAssocConfig

Definition at line 347 of file schema.py.

348 def sourceTableSql(schema, dbMappingConfig, sourceAssocConfig):
349  """Return a tuple of SQL statements (createStmt, loadStmt, sourceStmt)
350  for the Source table.
351 
352  createStmt : CREATE TABLE statement for the RunSource table, which
353  includes all fields from the run-specific
354  lsst.afw.table.Schema for source tables output by the
355  pipelines.
356 
357  loadStmt : LOAD DATA statement for the RunSource table. This is
358  a format string; to generate valid SQL a fileName must
359  be supplied, e.g.:
360 
361  loadStmt.format(fileName='source.csv')
362 
363  sourceStmt : Map the RunSource table to the canonical Source schema.
364  This will either create a VIEW, or INSERT into the
365  materialized equivalent.
366 
367  @param schema lsst.afw.table.Schema for sources
368  @param dbMappingConfig lsst.datarel.DbMappingConfig
369  @param sourceAssocConfig lsst.ap.tasks.sourceAssoc.SourceAssocConfig
370  """
371  # Generate SQL for run specific table
372  createStmt, loadStmt = genericTableSql(
373  schema,
374  dbMappingConfig.sourceConversion,
375  _sourceIndexes(sourceAssocConfig.sourceProcessing))
376  # build substitution parameters for mapping table
377  kw = _getMappingKw(
378  sourceAssocConfig.measSlots,
379  sourceAssocConfig.sourceProcessing,
380  sourceAssocConfig.measPrefix)
381  # build selection/output column lists
382  selcols = []
383  outcols = []
384  for runFmt, srcCol in _sourceMappings:
385  runCol = runFmt.format(**kw)
386  field = _colToField(runCol)
387  isFlag = srcCol.startswith('flag')
388  if isFlag and not dbMappingConfig.sourceConversion.flagsAsBits:
389  continue
390  if field in schema or runCol == 'coord_htmId20':
391  selcols.append(runCol)
392  elif isFlag:
393  selcols.append("b'0'")
394  else:
395  selcols.append('NULL')
396  outcols.append(srcCol)
397  if not dbMappingConfig.sourceConversion.flagsAsBits:
398  # Deal with canonical flags packed into BIGINTs
399  n = (len(dbMappingConfig.sourceConversion.canonicalFlags) + 62) / 63
400  if n == 1:
401  selcols.append('flags')
402  outcols.append('flags')
403  else:
404  for i in xrange(1, n + 1):
405  c = 'flags{}'.format(i)
406  selcols.append(c)
407  outcols.append(c)
408  if dbMappingConfig.asView:
409  # Replace the official version of Source with an equivalent VIEW
410  sourceStmt = 'CREATE OR REPLACE VIEW Source AS SELECT\n\t'
411  sourceStmt += ',\n\t'.join(a + ' AS ' + b for a,b in zip(selcols, outcols))
412  sourceStmt += '\nFROM RunSource;'
413  else:
414  # Use the definition of Source from cat (i.e. the one used by the
415  # schema browser for documentation purposes). This should cause
416  # ingest to fail if this code and the canonical schema are not in sync.
417  sourceStmt = 'INSERT INTO Source (\n\t'
418  sourceStmt += ',\n\t'.join(outcols)
419  sourceStmt += ')\nSELECT\n\t'
420  sourceStmt += ',\n\t'.join(selcols)
421  sourceStmt += '\nFROM RunSource;\n'
422  return (createStmt.format(tableName='RunSource'),
423  loadStmt.format(tableName='RunSource', fileName='{fileName}'),
424  sourceStmt)

Variable Documentation

list lsst.datarel.schema.__all__
Initial value:
1 = ['makeMysqlCsvConfig',
2  'DbMappingConfig',
3  'genericTableSql',
4  'sourceTableSql',
5  'objectTableSql',
6  'coaddSourceTableSql',
7  ]

Definition at line 29 of file schema.py.

list lsst.datarel.schema._coaddSourceMappings

Definition at line 568 of file schema.py.

dictionary lsst.datarel.schema._dbType
Initial value:
1 = {
2  'I': 'INTEGER',
3  'L': 'BIGINT',
4  'F': 'FLOAT',
5  'D': 'DOUBLE',
6  'Angle': 'DOUBLE',
7  'Flag': 'BIT(1)',
8 }

Definition at line 37 of file schema.py.

list lsst.datarel.schema._filterMappings
Initial value:
1 = [
2  ("{filter}_obs_count", "{filter}ObsCount"),
3  ("{filter}_obs_time_min", "{filter}ObsTimeMin"),
4  ("{filter}_obs_time_max", "{filter}ObsTimeMax"),
5  ("{filter}_{measPrefix}{psfFlux}", "{filter}PsfFlux"),
6  ("{filter}_{measPrefix}{psfFlux}_err", "{filter}PsfFluxSigma"),
7  ("{filter}_{measPrefix}{psfFlux}_count", "{filter}PsfFluxCount"),
8  ("{filter}_{measPrefix}{apFlux}", "{filter}ApFlux"),
9  ("{filter}_{measPrefix}{apFlux}_err", "{filter}ApFluxSigma"),
10  ("{filter}_{measPrefix}{apFlux}_count", "{filter}ApFluxCount"),
11  ("{filter}_{measPrefix}{modelFlux}", "{filter}ModelFlux"),
12  ("{filter}_{measPrefix}{modelFlux}_err", "{filter}ModelFluxSigma"),
13  ("{filter}_{measPrefix}{modelFlux}_count", "{filter}ModelFluxCount"),
14  ("{filter}_{measPrefix}{instFlux}", "{filter}InstFlux"),
15  ("{filter}_{measPrefix}{instFlux}_err", "{filter}InstFluxSigma"),
16  ("{filter}_{measPrefix}{instFlux}_count", "{filter}InstFluxCount"),
17  ("{filter}_{measPrefix}{shape}_Ixx", "{filter}ShapeIxx"),
18  ("{filter}_{measPrefix}{shape}_Iyy", "{filter}ShapeIyy"),
19  ("{filter}_{measPrefix}{shape}_Ixy", "{filter}ShapeIxy"),
20  ("{filter}_{measPrefix}{shape}_IxxVar", "{filter}ShapeIxxVar"),
21  ("{filter}_{measPrefix}{shape}_IyyVar", "{filter}ShapeIyyVar"),
22  ("{filter}_{measPrefix}{shape}_IxyVar", "{filter}ShapeIxyVar"),
23  ("{filter}_{measPrefix}{shape}_IxxIyyCov", "{filter}ShapeIxxIyyCov"),
24  ("{filter}_{measPrefix}{shape}_IxxIxyCov", "{filter}ShapeIxxIxyCov"),
25  ("{filter}_{measPrefix}{shape}_IyyIxyCov", "{filter}ShapeIyyIxyCov"),
26  ("{filter}_{measPrefix}{shape}_count", "{filter}ShapeCount"),
27 ]

Definition at line 445 of file schema.py.

list lsst.datarel.schema._forcedSourceMappings

Definition at line 731 of file schema.py.

list lsst.datarel.schema._objectMappings
Initial value:
1 = [
2  ("id", "objectId"),
3  ("coord_ra", "ra"),
4  ("coord_decl", "decl"),
5  ("coord_raVar", "raVar"),
6  ("coord_declVar", "declVar"),
7  ("coord_radeclCov", "radeclCov"),
8  ("coord_htmId20", "htmId20"),
9  ("coord_weightedmean_ra", "wmRa"),
10  ("coord_weightedmean_decl", "wmDecl"),
11  ("coord_weightedmean_raVar", "wmRaVar"),
12  ("coord_weightedmean_declVar", "wmDeclVar"),
13  ("coord_weightedmean_radeclCov", "wmRadeclCov"),
14  ("obs_count", "obsCount"),
15  ("obs_time_min", "obsTimeMin"),
16  ("obs_time_max", "obsTimeMax"),
17  ("obs_time_mean", "obsTimeMean"),
18  ("flag_noise", "flagNoise"),
19 ]

Definition at line 425 of file schema.py.

list lsst.datarel.schema._sourceMappings

Definition at line 255 of file schema.py.