Source code for lsst.sims.maf.metricBundles.moMetricBundle

from __future__ import print_function
from builtins import object
import os
import warnings
import numpy as np
import numpy.ma as ma
import matplotlib.pyplot as plt

from lsst.sims.maf.metrics import BaseMoMetric
from lsst.sims.maf.metrics import MoCompletenessMetric, ValueAtHMetric
from lsst.sims.maf.slicers import MoObjSlicer
from lsst.sims.maf.stackers import BaseMoStacker, MoMagStacker
from lsst.sims.maf.plots import PlotHandler
from lsst.sims.maf.plots import MetricVsH

from .metricBundle import MetricBundle

__all__ = ['MoMetricBundle', 'MoMetricBundleGroup', 'createEmptyMoMetricBundle', 'makeCompletenessBundle']


[docs]def createEmptyMoMetricBundle(): """Create an empty metric bundle. Returns ------- ~lsst.sims.maf.metricBundles.MoMetricBundle An empty metric bundle, configured with just the :class:`BaseMetric` and :class:`BaseSlicer`. """ return MoMetricBundle(BaseMoMetric(), MoObjSlicer(), None)
[docs]def makeCompletenessBundle(bundle, summaryName='CumulativeCompleteness', Hmark=None, resultsDb=None): """ Make a mock metric bundle from a bundle which had MoCompleteness or MoCumulativeCompleteness summary metrics run. This lets us use the plotHandler + plots.MetricVsH to generate plots. Parameters ---------- bundle : ~lsst.sims.maf.metricBundles.MetricBundle The metric bundle with a completeness summary statistic. summaryName : str, opt The name of the summary statistic. Default "CumulativeCompleteness". Hmark : float, opt The Hmark value to add to the plotting dictionary of the new mock bundle. Default None. resultsDb : ~lsst.sims.maf.db.ResultsDb, opt The resultsDb in which to record the summary statistic value at Hmark. Default None. Returns ------- ~lsst.sims.maf.metricBundles.MoMetricBundle """ # First look for summary value: try: bundle.summaryValues[summaryName] # If not found, then just run it (assuming it's completeness metric). except (TypeError, KeyError): if summaryName == 'DifferentialCompleteness': metric = MoCompletenessMetric(cumulative=False) else: metric = MoCompletenessMetric(cumulative=True) bundle.setSummaryMetrics(metric) bundle.computeSummaryStats(resultsDb) # Make up the bundle, including the metric values. completeness = ma.MaskedArray(data=bundle.summaryValues[summaryName]['value'], mask=np.zeros(len(bundle.summaryValues[summaryName]['value'])), fill_value=0) mb = MoMetricBundle(MoCompletenessMetric(metricName=summaryName), bundle.slicer, constraint=bundle.constraint, runName=bundle.runName, metadata=bundle.metadata) plotDict = {} plotDict.update(bundle.plotDict) plotDict['label'] = bundle.metadata mb.metricValues = completeness.reshape(1, len(completeness)) if Hmark is not None: metric = ValueAtHMetric(Hmark=Hmark) mb.setSummaryMetrics(metric) mb.computeSummaryStats(resultsDb) val = mb.summaryValues['Value At H=%.1f' % Hmark] if summaryName == 'CumulativeCompleteness': plotDict['label'] += ' : @ H(<=%.1f) = %.1f%s' % (Hmark, val * 100, '%') else: plotDict['label'] += ' : @ H(=%.1f) = %.1f%s' % (Hmark, val * 100, '%') mb.setPlotDict(plotDict) return mb
[docs]class MoMetricBundle(MetricBundle): def __init__(self, metric, slicer, constraint=None, stackerList=None, runName='opsim', metadata=None, fileRoot=None, plotDict=None, plotFuncs=None, displayDict=None, childMetrics=None, summaryMetrics=None): """ Instantiate moving object metric bundle, save metric/slicer/constraint, etc. """ self.metric = metric self.slicer = slicer if constraint == '': constraint = None self.constraint = constraint # Set the stackerlist. if stackerList is not None: if isinstance(stackerList, BaseMoStacker): self.stackerList = [stackerList, ] else: self.stackerList = [] for s in stackerList: if not isinstance(s, BaseMoStacker): raise ValueError('stackerList must only contain ' 'lsst.sims.maf.stackers.BaseMoStacker type objs') self.stackerList.append(s) else: self.stackerList = [] # Add the basic 'visibility/mag' stacker if not present. magStackerFound = False for s in self.stackerList: if s.__class__.__name__ == 'MoMagStacker': magStackerFound = True break if not magStackerFound: self.stackerList.append(MoMagStacker()) # Set a mapsList just for compatibility with generic MetricBundle. self.mapsList = [] # Add the summary stats, if applicable. self.setSummaryMetrics(summaryMetrics) # Set the provenance/metadata. self.runName = runName self._buildMetadata(metadata) # Build the output filename root if not provided. if fileRoot is not None: self.fileRoot = fileRoot else: self._buildFileRoot() # Set the plotting classes/functions. self.setPlotFuncs(plotFuncs) # Set the plotDict and displayDicts. self.plotDict = {'units': '@H'} self.setPlotDict(plotDict) # Update/set displayDict. self.displayDict = {} self.setDisplayDict(displayDict) # Set the list of child metrics. self.setChildBundles(childMetrics) # This is where we store the metric values and summary stats. self.metricValues = None self.summaryValues = None def _resetMetricBundle(self): """Reset all properties of MetricBundle. """ self.metric = None self.slicer = None self.constraint = None self.stackerList = [MoMagStacker()] self.mapsList = [] self.summaryMetrics = [] self.plotFuncs = [] self.runName = 'opsim' self.metadata = '' self.dbCols = None self.fileRoot = None self.plotDict = {} self.displayDict = {} self.childMetrics = None self.metricValues = None self.summaryValues = None def _buildMetadata(self, metadata): """If no metadata is provided, auto-generate it from the obsFile + constraint. """ if metadata is None: try: self.metadata = self.slicer.obsfile.replace('.txt', '').replace('.dat', '') self.metadata = self.metadata.replace('_obs', '').replace('_allObs', '') except AttributeError: self.metadata = 'noObs' # And modify by constraint. if self.constraint is not None: self.metadata += ' ' + self.constraint else: self.metadata = metadata def _findReqCols(self): # Doesn't quite work the same way yet. No stacker list, for example. raise NotImplementedError
[docs] def setChildBundles(self, childMetrics=None): """ Identify any child metrics to be run on this (parent) bundle. and create the new metric bundles that will hold the child values, linking to this bundle. Remove the summaryMetrics from self afterwards. """ self.childBundles = {} if childMetrics is None: childMetrics = self.metric.childMetrics for cName, cMetric in childMetrics.items(): cBundle = MoMetricBundle(metric=cMetric, slicer=self.slicer, constraint=self.constraint, stackerList=self.stackerList, runName=self.runName, metadata=self.metadata, plotDict=self.plotDict, plotFuncs=self.plotFuncs, displayDict=self.displayDict, summaryMetrics=self.summaryMetrics) self.childBundles[cName] = cBundle if len(childMetrics) > 0: self.summaryMetrics = []
[docs] def computeSummaryStats(self, resultsDb=None): """ Compute summary statistics on metricValues, using summaryMetrics, for self and child bundles. """ if self.summaryValues is None: self.summaryValues = {} if self.summaryMetrics is not None: # Build array of metric values, to use for (most) summary statistics. for m in self.summaryMetrics: summaryName = m.name summaryVal = m.run(self.metricValues, self.slicer.slicePoints['H']) self.summaryValues[summaryName] = summaryVal # Add summary metric info to results database, if applicable. if resultsDb: metricId = resultsDb.updateMetric(self.metric.name, self.slicer.slicerName, self.runName, self.constraint, self.metadata, None) resultsDb.updateSummaryStat(metricId, summaryName=summaryName, summaryValue=summaryVal)
[docs] def reduceMetric(self, reduceFunc, reducePlotDict=None, reduceDisplayDict=None): raise NotImplementedError
[docs] def read(self, filename): "Read metric data back into a metricBundle, as best as possible." if not os.path.isfile(filename): raise IOError('%s not found' % filename) self._resetMetricBundle() # Must read the data using a moving object slicer. slicer = MoObjSlicer() self.metricValues, self.slicer = slicer.readData(filename) # It's difficult to reinstantiate the metric object, as we don't # know what it is necessarily -- the metricName can be changed. self.metric = BaseMoMetric() # But, for plot label building, we do need to try to recreate the # metric name and units. We can't really do that yet - need more infrastructure. self.metric.name = '' self.constraint = None self.metadata = None path, head = os.path.split(filename) self.fileRoot = head.replace('.h5', '') self.setPlotFuncs([MetricVsH()])
[docs]class MoMetricBundleGroup(object): def __init__(self, bundleDict, outDir='.', resultsDb=None, verbose=True): self.verbose = verbose self.bundleDict = bundleDict self.outDir = outDir if not os.path.isdir(self.outDir): os.makedirs(self.outDir) self.resultsDb = resultsDb self.slicer = list(self.bundleDict.values())[0].slicer for b in self.bundleDict.values(): if b.slicer != self.slicer: raise ValueError('Currently, the slicers for the MoMetricBundleGroup must be equal,' ' using the same observations and Hvals.') self.constraints = list(set([b.constraint for b in bundleDict.values()])) def _checkCompatible(self, metricBundle1, metricBundle2): """Check if two MetricBundles are "compatible". Compatible indicates that the constraints, the slicers, and the maps are the same, and that the stackers do not interfere with each other (i.e. are not trying to set the same column in different ways). Returns True if the MetricBundles are compatible, False if not. Parameters ---------- metricBundle1 : MetricBundle metricBundle2 : MetricBundle Returns ------- bool """ if metricBundle1.constraint != metricBundle2.constraint: return False if metricBundle1.slicer != metricBundle2.slicer: return False if metricBundle1.mapsList.sort() != metricBundle2.mapsList.sort(): return False for stacker in metricBundle1.stackerList: for stacker2 in metricBundle2.stackerList: # If the stackers have different names, that's OK, and if they are identical, that's ok. if (stacker.__class__.__name__ == stacker2.__class__.__name__) & (stacker != stacker2): return False # But if we got this far, everything matches. return True def _findCompatible(self, testKeys): """"Private utility to find which metricBundles with keys in the list 'testKeys' can be calculated at the same time -- having the same slicer, constraint, maps, and compatible stackers. Parameters ----------- testKeys : list List of the dictionary keys (of self.bundleDict) to test for compatibilility. Returns -------- list of lists Returns testKeys, split into separate lists of compatible metricBundles. """ compatibleLists = [] for k in testKeys: try: b = self.bundleDict[k] except KeyError: warnings.warn('Received %s in testkeys, but this is not present in self.bundleDict.' 'Will continue, but this is not expected.') continue foundCompatible = False checkedAll = False while not(foundCompatible) and not(checkedAll): # Go through the existing lists in compatibleLists, to see if this metricBundle matches. for compatibleList in compatibleLists: # Compare to all the metricBundles in this subset, to check all stackers are compatible. foundCompatible = True for comparisonKey in compatibleList: compatible = self._checkCompatible(self.bundleDict[comparisonKey], b) if not compatible: # Found a metricBundle which is not compatible, so stop and go onto the next subset. foundCompatible = False break checkedAll = True if foundCompatible: compatibleList.append(k) else: compatibleLists.append([k,]) return compatibleLists
[docs] def runConstraint(self, constraint): """Calculate the metric values for all the metricBundles which match this constraint in the metricBundleGroup. Also calculates child metrics and summary statistics, and writes all to disk. (work is actually done in _runCompatible, so that only completely compatible sets of metricBundles run at the same time). Parameters ---------- constraint : str SQL-where or pandas constraint for the metricBundles. """ # Find the dict keys of the bundles which match this constraint. keysMatchingConstraint = [] for k, b in self.bundleDict.items(): if b.constraint == constraint: keysMatchingConstraint.append(k) if len(keysMatchingConstraint) == 0: return # Identify the observations which are relevant for this constraint. # This sets slicer.obs (valid for all H values). self.slicer.subsetObs(constraint) # Identify the sets of these metricBundles can be run at the same time (also have the same stackers). compatibleLists = self._findCompatible(keysMatchingConstraint) # And now run each of those subsets of compatible metricBundles. for compatibleList in compatibleLists: self._runCompatible(compatibleList)
def _runCompatible(self, compatibleList): """Calculate the metric values for set of (parent and child) bundles, as well as the summary stats, and write to disk. Parameters ----------- compatibleList : list List of dictionary keys, of the metricBundles which can be calculated together. This means they are 'compatible' and have the same slicer, constraint, and non-conflicting mappers and stackers. """ if self.verbose: print('Running metrics %s' % compatibleList) bDict = self.bundleDict # {key: self.bundleDict.get(key) for key in compatibleList} # Find the unique stackers and maps. These are already "compatible" (as id'd by compatibleList). uniqStackers = [] allStackers = [] uniqMaps = [] allMaps = [] for b in bDict.values(): allStackers += b.stackerList allMaps += b.mapsList for s in allStackers: if s not in uniqStackers: uniqStackers.append(s) for m in allMaps: if m not in uniqMaps: uniqMaps.append(m) if len(uniqMaps) > 0: print("Got some maps .. that was unexpected at the moment. Can't use them here yet.") # Set up all of the metric values, including for the child bundles. for k in compatibleList: b = self.bundleDict[k] b._setupMetricValues() for cb in b.childBundles.values(): cb._setupMetricValues() # Calculate the metric values. for i, slicePoint in enumerate(self.slicer): ssoObs = slicePoint['obs'] for j, Hval in enumerate(slicePoint['Hvals']): # Run stackers to add extra columns (that depend on Hval) with warnings.catch_warnings(): warnings.simplefilter('ignore') for s in uniqStackers: ssoObs = s.run(ssoObs, slicePoint['orbit']['H'], Hval) # Run all the parent metrics. for k in compatibleList: b = self.bundleDict[k] # Mask the parent metric (and then child metrics) if there was no data. if len(ssoObs) == 0: b.metricValues.mask[i][j] = True for cb in list(b.childBundles.values()): cb.metricValues.mask[i][j] = True # Otherwise, calculate the metric value for the parent, and then child. else: # Calculate for the parent. mVal = b.metric.run(ssoObs, slicePoint['orbit'], Hval) # Mask if the parent metric returned a bad value. if mVal == b.metric.badval: b.metricValues.mask[i][j] = True for cb in b.childBundles.values(): cb.metricValues.mask[i][j] = True # Otherwise, set the parent value and calculate the child metric values as well. else: b.metricValues.data[i][j] = mVal for cb in b.childBundles.values(): childVal = cb.metric.run(ssoObs, slicePoint['orbit'], Hval, mVal) if childVal == cb.metric.badval: cb.metricValues.mask[i][j] = True else: cb.metricValues.data[i][j] = childVal for k in compatibleList: b = self.bundleDict[k] b.computeSummaryStats(self.resultsDb) for cB in b.childBundles.values(): cB.computeSummaryStats(self.resultsDb) # Write to disk. cB.write(outDir=self.outDir, resultsDb=self.resultsDb) # Write to disk. b.write(outDir=self.outDir, resultsDb=self.resultsDb)
[docs] def runAll(self): """ Run all constraints and metrics for these moMetricBundles. """ for constraint in self.constraints: self.runConstraint(constraint) if self.verbose: print('Calculated and saved all metrics.')
[docs] def plotAll(self, savefig=True, outfileSuffix=None, figformat='pdf', dpi=600, thumbnail=True, closefigs=True): """ Make a few generically desired plots. This needs more flexibility in the future. """ plotHandler = PlotHandler(outDir=self.outDir, resultsDb=self.resultsDb, savefig=savefig, figformat=figformat, dpi=dpi, thumbnail=thumbnail) for b in self.bundleDict.values(): try: b.plot(plotHandler=plotHandler, outfileSuffix=outfileSuffix, savefig=savefig) except ValueError as ve: message = 'Plotting failed for metricBundle %s.' % (b.fileRoot) message += ' Error message: %s' % (ve.message) warnings.warn(message) if closefigs: plt.close('all') if self.verbose: print('Plotting all metrics.')