Source code for desispec.specstatus

"""
desispec.specstatus
===================

Update surveyops/ops/tile-specstatus.ecsv with spectro pipeline tiles.csv.
"""

import numpy as np
from astropy.table import Table, vstack

from desiutil.log import get_logger


[docs]
def update_specstatus(specstatus, tiles, update_only=False,
                      clear_qa=False):
    """
    return new specstatus table, updated with tiles table

    Args:
        specstatus: astropy Table from surveyops/ops/tiles-specstatus.ecsv
        tiles: astropy Table from spectro/redux/daily/tiles.csv
        update_only: bool don't change entries for tiles that have no new data.
        clear_qa: bool indicating whether QA data should be cleared

    Returns: updated specstatus table, sorted by TILEID

    New TILEID found in tiles are added to specstatus, and any TILEID
    already in specstatus have their non-QA columns updated from the
    entries in tiles.

    If update_only==True, add any new tiles and update non-QA columns
    for tiles with new data (tiles['LASTNIGHT'] > specstatus['LASTNIGHT'])
    but don't change entries for reprocessed tiles that have no new data.

    The QA-related columns that are not changed here are
    USER, QA, OVERRIDE, ZDONE, QANIGHT, and ARCHIVEDATE.

    This does not modify either of the input tables.
    """

    log = get_logger()
    specstatus = specstatus.copy()
    tiles = tiles.copy()

    #- Added for Fuji, but not in tiles-specstatus so remove
    if 'PROGRAM' in tiles.colnames:
        tiles.remove_column('PROGRAM')

    # Quick and dirty fix to keep the tiles file compatible with the specstatus file.
    if 'UPDATED' in tiles.colnames:
        tiles.remove_column('UPDATED')

    #- Confirm that they have the same columns except QA-specific ones
    tilecol = set(tiles.colnames) | set(['USER', 'QA', 'OVERRIDE', 'ZDONE', 'QANIGHT', 'ARCHIVEDATE'])
    if tilecol != set(specstatus.colnames):
        log.error(f'Column mismatch: {tiles.colnames} vs. {specstatus.colnames}')
        raise ValueError('Incompatible specstatus and tiles columns')

    #- even if present in tiles, specstatus trumps for these columns
    #- (i.e. never update them)
    qacols = ['USER', 'QA', 'OVERRIDE', 'ZDONE', 'QANIGHT', 'ARCHIVEDATE']

    #- Add any new tiles
    newtilerows = np.isin(tiles['TILEID'], specstatus['TILEID'], invert=True)
    num_newtiles = np.count_nonzero(newtilerows)
    if num_newtiles > 0:
        tt = list(tiles['TILEID'][newtilerows])
        log.info(f'Adding {num_newtiles} new tiles: {tt}')

        newtiles = tiles[newtilerows]
        newtiles['USER'] = np.repeat('none',num_newtiles)
        newtiles['QA'] = np.repeat('none',num_newtiles)
        newtiles['OVERRIDE'] = np.repeat(0,num_newtiles)
        newtiles['ZDONE'] = np.repeat('false',num_newtiles)
        newtiles['QANIGHT'] = np.repeat(0,num_newtiles)
        newtiles['ARCHIVEDATE'] = np.repeat(0,num_newtiles)
        newtiles = newtiles[specstatus.colnames]  #- columns in same order

        specstatus = vstack([specstatus, newtiles])
    else:
        log.info('No new tiles to add')

    #- At this point, every TILEID in tiles should be in specstatus,
    #- but ok if specstatus has TILEID not in tiles
    assert np.all(np.isin(tiles['TILEID'], specstatus['TILEID']))

    #- For rows with more recent LASTNIGHT (new data), update non-QA columns.
    #- Note: there is probably a more efficient way of doing this in bulk,
    #- but let's favor obvious over clever unless efficiency is needed
    num_updatedtiles = 0
    log.debug('Checking for differences between tiles file and specstatus file')
    for i, tileid in enumerate(tiles['TILEID']):
        j = np.where(specstatus['TILEID'] == tileid)[0][0]
        if not update_only or tiles['LASTNIGHT'][i] > specstatus['LASTNIGHT'][j]:
            different = False
            for col in specstatus.colnames:
                if col not in qacols:
                    if tiles[col][i] != specstatus[col][j]:
                        log.debug('Tile %d updating %s %s -> %s',
                                  tileid, col, str(specstatus[col][j]), str(tiles[col][i]))
                        different = True
            if not different and not clear_qa:
                continue
            log.info('Updating TILEID {} LASTNIGHT {} (orig LASTNIGHT {})'.format(
                tileid, tiles['LASTNIGHT'][i], specstatus['LASTNIGHT'][j]))

            num_updatedtiles += 1
            for col in specstatus.colnames:
                if col not in qacols:
                    specstatus[col][j] = tiles[col][i]
            if clear_qa:
                specstatus['QA'][j] = 'none'

    log.info(f'Added {num_newtiles} and updated {num_updatedtiles} tiles')

    specstatus.sort('TILEID')

    return specstatus