Source code for satpy.readers.olci_nc

#!/usr/bin/env python
# -*- coding: utf-8 -*-
# Copyright (c) 2016 Satpy developers
#
# This file is part of satpy.
#
# satpy is free software: you can redistribute it and/or modify it under the
# terms of the GNU General Public License as published by the Free Software
# Foundation, either version 3 of the License, or (at your option) any later
# version.
#
# satpy is distributed in the hope that it will be useful, but WITHOUT ANY
# WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR
# A PARTICULAR PURPOSE.  See the GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License along with
# satpy.  If not, see <http://www.gnu.org/licenses/>.
"""Sentinel-3 OLCI reader.

This reader supports an optional argument to choose the 'engine' for reading
OLCI netCDF4 files. By default, this reader uses the default xarray choice of
engine, as defined in the :func:`xarray.open_dataset` documentation`.

As an alternative, the user may wish to use the 'h5netcdf' engine, but that is
not default as it typically prints many non-fatal but confusing error messages
to the terminal.
To choose between engines the user can  do as follows for the default::

    scn = Scene(filenames=my_files, reader='olci_l1b')

or as follows for the h5netcdf engine::

    scn = Scene(filenames=my_files,
                reader='olci_l1b', reader_kwargs={'engine': 'h5netcdf'})

References:
    - :func:`xarray.open_dataset`

"""


import logging
from functools import reduce

import dask.array as da
import numpy as np
import xarray as xr

from satpy._compat import cached_property
from satpy.readers import open_file_or_filename
from satpy.readers.file_handlers import BaseFileHandler
from satpy.utils import angle2xyz, get_legacy_chunk_size, xyz2angle

DEFAULT_MASK_ITEMS = ["INVALID", "SNOW_ICE", "INLAND_WATER", "SUSPECT",
                      "AC_FAIL", "CLOUD", "HISOLZEN", "OCNN_FAIL",
                      "CLOUD_MARGIN", "CLOUD_AMBIGUOUS", "LOWRW", "LAND"]

logger = logging.getLogger(__name__)

CHUNK_SIZE = get_legacy_chunk_size()

PLATFORM_NAMES = {"S3A": "Sentinel-3A",
                  "S3B": "Sentinel-3B",
                  "ENV": "Environmental Satellite"}



[docs]
class BitFlags:
    """Manipulate flags stored bitwise."""

    def __init__(self, value, flag_list=None):
        """Init the flags."""
        self._value = value

        if flag_list is None:
            try:
                meanings = value.attrs["flag_meanings"].split()
                masks = value.attrs["flag_masks"]
            except (AttributeError, KeyError):
                meanings = ["INVALID", "WATER", "LAND", "CLOUD", "SNOW_ICE",
                            "INLAND_WATER", "TIDAL", "COSMETIC", "SUSPECT",
                            "HISOLZEN", "SATURATED", "MEGLINT", "HIGHGLINT",
                            "WHITECAPS", "ADJAC", "WV_FAIL", "PAR_FAIL",
                            "AC_FAIL", "OC4ME_FAIL", "OCNN_FAIL",
                            "Extra_1",
                            "KDM_FAIL",
                            "Extra_2",
                            "CLOUD_AMBIGUOUS", "CLOUD_MARGIN", "BPAC_ON", "WHITE_SCATT",
                            "LOWRW", "HIGHRW"]
                self.meaning = {meaning: mask for mask, meaning in enumerate(meanings)}
            else:
                self.meaning = {meaning: int(np.log2(mask)) for meaning, mask in zip(meanings, masks)}
        else:
            self.meaning = {meaning: mask for mask, meaning in enumerate(flag_list)}

    def __getitem__(self, item):
        """Get the item."""
        pos = self.meaning[item]
        data = self._value
        if isinstance(data, xr.DataArray):
            data = data.data
            res = ((data >> pos) % 2).astype(bool)
            res = xr.DataArray(res, coords=self._value.coords,
                               attrs=self._value.attrs,
                               dims=self._value.dims)
        else:
            res = ((data >> pos) % 2).astype(bool)
        return res




[docs]
class NCOLCIBase(BaseFileHandler):
    """The OLCI reader base."""

    rows_name = "rows"
    cols_name = "columns"

    def __init__(self, filename, filename_info, filetype_info,
                 engine=None, **kwargs):
        """Init the olci reader base."""
        super().__init__(filename, filename_info, filetype_info)
        self._engine = engine
        self._start_time = filename_info["start_time"]
        self._end_time = filename_info["end_time"]
        # TODO: get metadata from the manifest file (xfdumanifest.xml)
        self.platform_name = PLATFORM_NAMES[filename_info["mission_id"]]
        self.sensor = "olci"

    @cached_property
    def nc(self):
        """Get the nc xr dataset."""
        f_obj = open_file_or_filename(self.filename)
        dataset = xr.open_dataset(f_obj,
                                  decode_cf=True,
                                  mask_and_scale=True,
                                  engine=self._engine,
                                  chunks={self.cols_name: CHUNK_SIZE,
                                          self.rows_name: CHUNK_SIZE})
        return dataset.rename({self.cols_name: "x", self.rows_name: "y"})

    @property
    def start_time(self):
        """Start time property."""
        return self._start_time

    @property
    def end_time(self):
        """End time property."""
        return self._end_time


[docs]
    def get_dataset(self, key, info):
        """Load a dataset."""
        logger.debug("Reading %s.", key["name"])
        variable = self.nc[key["name"]]

        return variable





[docs]
class NCOLCICal(NCOLCIBase):
    """Dummy class for calibration."""




[docs]
class NCOLCIGeo(NCOLCIBase):
    """Dummy class for navigation."""




[docs]
class NCOLCIChannelBase(NCOLCIBase):
    """Base class for channel reading."""

    def __init__(self, filename, filename_info, filetype_info, engine=None):
        """Init the file handler."""
        super().__init__(filename, filename_info, filetype_info, engine)
        self.channel = filename_info.get("dataset_name")
        self.reflectance_prefix = "Oa"
        self.reflectance_suffix = "_reflectance"




[docs]
class NCOLCI1B(NCOLCIChannelBase):
    """File handler for OLCI l1b."""

    def __init__(self, filename, filename_info, filetype_info, cal, engine=None):
        """Init the file handler."""
        super().__init__(filename, filename_info, filetype_info, engine)
        self.cal = cal.nc


[docs]
    @staticmethod
    def _get_items(idx, solar_flux):
        """Get items."""
        return solar_flux[idx]



[docs]
    def _get_solar_flux(self, band):
        """Get the solar flux for the band."""
        solar_flux = self.cal["solar_flux"].isel(bands=band).values
        d_index = self.cal["detector_index"].fillna(0).astype(int)

        return da.map_blocks(self._get_items, d_index.data,
                             solar_flux=solar_flux, dtype=solar_flux.dtype)



[docs]
    def get_dataset(self, key, info):
        """Load a dataset."""
        if self.channel != key["name"]:
            return
        logger.debug("Reading %s.", key["name"])

        radiances = self.nc[self.channel + "_radiance"]

        if key["calibration"] == "reflectance":
            idx = int(key["name"][2:]) - 1
            sflux = self._get_solar_flux(idx)
            radiances = radiances / sflux * np.pi * 100
            radiances.attrs["units"] = "%"

        radiances.attrs["platform_name"] = self.platform_name
        radiances.attrs["sensor"] = self.sensor
        radiances.attrs.update(key.to_dict())
        return radiances





[docs]
class NCOLCI2(NCOLCIChannelBase):
    """File handler for OLCI l2."""

    def __init__(self, filename, filename_info, filetype_info, engine=None, unlog=False, mask_items=None):
        """Init the file handler."""
        super().__init__(filename, filename_info, filetype_info, engine)
        self.unlog = unlog
        self.mask_items = mask_items


[docs]
    def get_dataset(self, key, info):
        """Load a dataset."""
        if self.channel is not None and self.channel != key["name"]:
            return
        logger.debug("Reading %s.", key["name"])
        if self.channel is not None and self.channel.startswith(self.reflectance_prefix):
            dataset = self.nc[self.channel + self.reflectance_suffix]
        else:
            dataset = self.nc[info["nc_key"]]

        if key["name"] == "wqsf":
            dataset.attrs["_FillValue"] = 1
        elif key["name"] == "mask":
            dataset = self.getbitmask(dataset, self.mask_items)
        dataset.attrs["platform_name"] = self.platform_name
        dataset.attrs["sensor"] = self.sensor
        dataset.attrs.update(key.to_dict())
        if self.unlog:
            dataset = self.delog(dataset)

        return dataset



[docs]
    def delog(self, data_array):
        """Remove log10 from the units and values."""
        units = data_array.attrs["units"]

        if units.startswith("lg("):
            data_array = 10 ** data_array
            data_array.attrs["units"] = units.split("lg(re ")[1].strip(")")
        return data_array



[docs]
    def getbitmask(self, wqsf, items=None):
        """Get the bitmask."""
        if items is None:
            items = DEFAULT_MASK_ITEMS
        bflags = BitFlags(wqsf)
        return reduce(np.logical_or, [bflags[item] for item in items])





[docs]
class NCOLCILowResData(NCOLCIBase):
    """Handler for low resolution data."""

    rows_name = "tie_rows"
    cols_name = "tie_columns"

    def __init__(self, filename, filename_info, filetype_info,
                 engine=None, **kwargs):
        """Init the file handler."""
        super().__init__(filename, filename_info, filetype_info, engine)
        self.l_step = self.nc.attrs["al_subsampling_factor"]
        self.c_step = self.nc.attrs["ac_subsampling_factor"]


[docs]
    def _do_interpolate(self, data):

        if not isinstance(data, tuple):
            data = (data,)

        shape = data[0].shape

        from geotiepoints.interpolator import Interpolator
        tie_lines = np.arange(0, (shape[0] - 1) * self.l_step + 1, self.l_step)
        tie_cols = np.arange(0, (shape[1] - 1) * self.c_step + 1, self.c_step)
        lines = np.arange((shape[0] - 1) * self.l_step + 1)
        cols = np.arange((shape[1] - 1) * self.c_step + 1)
        along_track_order = 1
        cross_track_order = 3
        satint = Interpolator([x.values for x in data],
                              (tie_lines, tie_cols),
                              (lines, cols),
                              along_track_order,
                              cross_track_order)
        int_data = satint.interpolate()

        return [xr.DataArray(da.from_array(x, chunks=(CHUNK_SIZE, CHUNK_SIZE)),
                             dims=["y", "x"]) for x in int_data]


    @property
    def _need_interpolation(self):
        return (self.c_step != 1 or self.l_step != 1)




[docs]
class NCOLCIAngles(NCOLCILowResData):
    """File handler for the OLCI angles."""

    datasets = {"satellite_azimuth_angle": "OAA",
                "satellite_zenith_angle": "OZA",
                "solar_azimuth_angle": "SAA",
                "solar_zenith_angle": "SZA"}


[docs]
    def get_dataset(self, key, info):
        """Load a dataset."""
        if key["name"] not in self.datasets:
            return

        logger.debug("Reading %s.", key["name"])

        if self._need_interpolation:
            if key["name"].startswith("satellite"):
                azi, zen = self.satellite_angles
            elif key["name"].startswith("solar"):
                azi, zen = self.sun_angles
            else:
                raise NotImplementedError("Don't know how to read " + key["name"])

            if "zenith" in key["name"]:
                values = zen
            elif "azimuth" in key["name"]:
                values = azi
            else:
                raise NotImplementedError("Don't know how to read " + key["name"])
        else:
            values = self.nc[self.datasets[key["name"]]]

        values.attrs["platform_name"] = self.platform_name
        values.attrs["sensor"] = self.sensor

        values.attrs.update(key.to_dict())
        return values


    @cached_property
    def sun_angles(self):
        """Return the sun angles."""
        zen = self.nc[self.datasets["solar_zenith_angle"]]
        azi = self.nc[self.datasets["solar_azimuth_angle"]]
        azi, zen = self._interpolate_angles(azi, zen)
        return azi, zen

    @cached_property
    def satellite_angles(self):
        """Return the satellite angles."""
        zen = self.nc[self.datasets["satellite_zenith_angle"]]
        azi = self.nc[self.datasets["satellite_azimuth_angle"]]
        azi, zen = self._interpolate_angles(azi, zen)
        return azi, zen


[docs]
    def _interpolate_angles(self, azi, zen):
        aattrs = azi.attrs
        zattrs = zen.attrs
        x, y, z = angle2xyz(azi, zen)
        x, y, z = self._do_interpolate((x, y, z))
        azi, zen = xyz2angle(x, y, z)
        azi.attrs = aattrs
        zen.attrs = zattrs
        return azi, zen





[docs]
class NCOLCIMeteo(NCOLCILowResData):
    """File handler for the OLCI meteo data."""

    datasets = ["humidity", "sea_level_pressure", "total_columnar_water_vapour", "total_ozone"]

    def __init__(self, filename, filename_info, filetype_info,
                 engine=None):
        """Init the file handler."""
        super().__init__(filename, filename_info, filetype_info, engine)
        self.cache = {}

    # TODO: the following depends on more than columns, rows
    # float atmospheric_temperature_profile(tie_rows, tie_columns, tie_pressure_levels) ;
    # float horizontal_wind(tie_rows, tie_columns, wind_vectors) ;
    # float reference_pressure_level(tie_pressure_levels) ;


[docs]
    def get_dataset(self, key, info):
        """Load a dataset."""
        if key["name"] not in self.datasets:
            return

        logger.debug("Reading %s.", key["name"])

        if self._need_interpolation and self.cache.get(key["name"]) is None:

            data = self.nc[key["name"]]

            values, = self._do_interpolate(data)
            values.attrs = data.attrs

            self.cache[key["name"]] = values

        elif key["name"] in self.cache:
            values = self.cache[key["name"]]
        else:
            values = self.nc[key["name"]]

        values.attrs["platform_name"] = self.platform_name
        values.attrs["sensor"] = self.sensor

        values.attrs.update(key.to_dict())
        return values