Source code for climada.entity.exposures.base

"""
This file is part of CLIMADA.

Copyright (C) 2017 ETH Zurich, CLIMADA contributors listed in AUTHORS.

CLIMADA is free software: you can redistribute it and/or modify it under the
terms of the GNU Lesser General Public License as published by the Free
Software Foundation, version 3.

CLIMADA is distributed in the hope that it will be useful, but WITHOUT ANY
WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A
PARTICULAR PURPOSE.  See the GNU Lesser General Public License for more details.

You should have received a copy of the GNU Lesser General Public License along
with CLIMADA. If not, see <https://www.gnu.org/licenses/>.

---

Define Exposures class.
"""

__all__ = ['Exposures', 'add_sea']

import logging
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
from mpl_toolkits.axes_grid1 import make_axes_locatable
from geopandas import GeoDataFrame
import rasterio
from rasterio.warp import Resampling
import contextily as ctx

from climada.entity.tag import Tag
import climada.util.hdf5_handler as hdf5
from climada.util.constants import ONE_LAT_KM, DEF_CRS
import climada.util.coordinates as co
from climada.util.interpolation import interpol_index
import climada.util.plot as u_plot

LOGGER = logging.getLogger(__name__)

INDICATOR_IF = 'if_'
""" Name of the column containing the impact functions id of specified hazard"""

INDICATOR_CENTR = 'centr_'
""" Name of the column containing the centroids id of specified hazard """

DEF_REF_YEAR = 2018
""" Default reference year """

DEF_VALUE_UNIT = 'USD'
""" Default reference year """

DEF_VAR_MAT = {'sup_field_name': 'entity',
               'field_name': 'assets',
               'var_name': {'lat' : 'lat',
                            'lon' : 'lon',
                            'val' : 'Value',
                            'ded' : 'Deductible',
                            'cov' : 'Cover',
                            'imp' : 'DamageFunID',
                            'cat' : 'Category_ID',
                            'reg' : 'Region_ID',
                            'uni' : 'Value_unit',
                            'ass' : 'centroid_index',
                            'ref' : 'reference_year'
                           }
              }
""" MATLAB variable names """

class Exposures(GeoDataFrame):
    """geopandas GeoDataFrame with metadata and columns (pd.Series) defined in
    Attributes.

    Attributes:
        tag (Tag): metadata - information about the source data
        ref_year (int): metadata - reference year
        value_unit (str): metadata - unit of the exposures values
        latitude (pd.Series): latitude
        longitude (pd.Series): longitude
        crs (dict or crs): CRS information inherent to GeoDataFrame.
        value (pd.Series): a value for each exposure
        if_ (pd.Series, optional): e.g. if_TC. impact functions id for hazard
            TC. There might be different hazards defined: if_TC, if_FL, ...
            If not provided, set to default 'if_' with ids 1 in check().
        geometry (pd.Series, optional): geometry of type Point of each
            instance. Computed in method set_geometry_points().
        meta (dict): dictionary containing corresponding raster properties
            (if any): width, height, crs and transform must be present at
            least (transform needs to contain upper left corner!). Exposures
            might not contain all the points of the corresponding raster.
            Not used in internal computations.
        deductible (pd.Series, optional): deductible value for each exposure
        cover (pd.Series, optional): cover value for each exposure
        category_id (pd.Series, optional): category id for each exposure
        region_id (pd.Series, optional): region id for each exposure
        centr_ (pd.Series, optional): e.g. centr_TC. centroids index for
            hazard TC. There might be different hazards defined: centr_TC,
            centr_FL, ... Computed in method assign_centroids().
    """
    _metadata = GeoDataFrame._metadata + ['tag', 'ref_year', 'value_unit',
                                          'meta']

    vars_oblig = ['value', 'latitude', 'longitude']
    """Name of the variables needed to compute the impact."""

    vars_def = [INDICATOR_IF]
    """Name of variables that can be computed."""

    vars_opt = [INDICATOR_CENTR, 'deductible', 'cover', 'category_id',
                'region_id', 'geometry']
    """Name of the variables that aren't needed to compute the impact."""

    @property
    def _constructor(self):
        return Exposures

    def __init__(self, *args, **kwargs):
        """Initialize. Copy attributes of input DataFrame."""
        if len(args):
            for var_meta in self._metadata:
                try:
                    val_meta = getattr(args[0], var_meta)
                    setattr(self, var_meta, val_meta)
                except AttributeError:
                    pass
        super(Exposures, self).__init__(*args, **kwargs)

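    # Example (illustrative sketch, not part of the original module): the
    # minimal columns of a valid Exposures; check() then fills the metadata
    # and impact function defaults.
    #
    #     exp = Exposures(pd.DataFrame({'latitude': [46.2, 46.3],
    #                                   'longitude': [8.3, 8.4],
    #                                   'value': [1.0e6, 2.5e6]}))
    #     exp.check()  # sets tag, ref_year, value_unit and if_ defaults
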
    def check(self):
        """Check which variables are present"""
        # check metadata
        for var in self._metadata:
            if var[0] == '_':
                continue
            try:
                if getattr(self, var) is None and var == 'crs':
                    self.crs = DEF_CRS
                    LOGGER.info('%s set to default value: %s', var,
                                self.__dict__[var])
            except AttributeError:
                if var == 'tag':
                    self.tag = Tag()
                elif var == 'ref_year':
                    self.ref_year = DEF_REF_YEAR
                elif var == 'value_unit':
                    self.value_unit = DEF_VALUE_UNIT
                elif var == 'meta':
                    self.meta = None
                LOGGER.info('%s metadata set to default value: %s', var,
                            self.__dict__[var])

        for var in self.vars_oblig:
            if var not in self.columns:
                LOGGER.error("%s missing.", var)
                raise ValueError

        for var in self.vars_def:
            if var == INDICATOR_IF:
                found = np.array([var in var_col
                                  for var_col in self.columns]).any()
                if INDICATOR_IF in self.columns:
                    LOGGER.info("Hazard type not set in %s", var)
            else:
                found = var in self.columns
            if not found and var == INDICATOR_IF:
                LOGGER.info("Setting %s to default impact functions ids 1.",
                            var)
                self[INDICATOR_IF] = np.ones(self.shape[0], dtype=int)
            elif not found:
                LOGGER.info("%s not set.", var)

        for var in self.vars_opt:
            if var == INDICATOR_CENTR:
                found = np.array([var in var_col
                                  for var_col in self.columns]).any()
                if INDICATOR_CENTR in self.columns:
                    LOGGER.info("Hazard type not set in %s", var)
            else:
                found = var in self.columns
            if not found:
                LOGGER.info("%s not set.", var)
            elif var == 'geometry' and \
            (self.geometry.values[0].x != self.longitude.values[0] or
             self.geometry.values[0].y != self.latitude.values[0]):
                LOGGER.error('Geometry values do not correspond to latitude '
                             'and longitude. Use set_geometry_points() or '
                             'set_lat_lon().')
                raise ValueError

    def assign_centroids(self, hazard, method='NN', distance='haversine',
                         threshold=100):
        """Assign for each exposure coordinate closest hazard coordinate.
        -1 used for distances > threshold in point distances. If raster
        hazard, -1 used for centroids outside raster.

        Parameters:
            hazard (Hazard): hazard to match (with raster or vector centroids)
            method (str, optional): interpolation method to use in vector
                hazard. Nearest neighbor (NN) default
            distance (str, optional): distance to use in vector hazard.
                Haversine default
            threshold (float): distance threshold in km over which no neighbor
                will be found in vector hazard. Those are assigned with a -1.
                Default 100 km.
        """
        LOGGER.info('Matching %s exposures with %s centroids.',
                    str(self.shape[0]), str(hazard.centroids.size))
        if not co.equal_crs(self.crs, hazard.centroids.crs):
            LOGGER.error('Set hazard and exposure to same CRS first!')
            raise ValueError
        if hazard.centroids.meta:
            # raster hazard: compute the column/row index of each point from
            # the affine transform (upper left corner and pixel sizes)
            x_i = ((self.longitude.values
                    - hazard.centroids.meta['transform'][2])
                   / hazard.centroids.meta['transform'][0]).astype(int)
            y_i = ((self.latitude.values
                    - hazard.centroids.meta['transform'][5])
                   / hazard.centroids.meta['transform'][4]).astype(int)
            assigned = y_i * hazard.centroids.meta['width'] + x_i
            assigned[assigned < 0] = -1
            assigned[assigned >= hazard.centroids.size] = -1
        else:
            coord = np.stack([self.latitude.values, self.longitude.values],
                             axis=1)
            if np.array_equal(coord, hazard.centroids.coord):
                assigned = np.arange(self.shape[0])
            else:
                assigned = interpol_index(hazard.centroids.coord, coord,
                                          method=method, distance=distance,
                                          threshold=threshold)
        self[INDICATOR_CENTR + hazard.tag.haz_type] = assigned

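    # Example (illustrative sketch; `haz` stands for any Hazard instance with
    # haz_type 'TC'): matching adds a centr_TC column to the exposures, with
    # -1 for points farther from any centroid than the threshold.
    #
    #     exp.assign_centroids(haz)
    #     exp['centr_TC']  # index of the closest hazard centroid per point
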
    def set_geometry_points(self, scheduler=None):
        """Set geometry attribute of GeoDataFrame with Points from latitude
        and longitude attributes.

        Parameters:
            scheduler (str): used for dask map_partitions. "threads",
                "synchronous" or "processes"
        """
        co.set_df_geometry_points(self, scheduler)

    def set_lat_lon(self):
        """Set latitude and longitude attributes from geometry attribute."""
        LOGGER.info('Setting latitude and longitude attributes.')
        self['latitude'] = self.geometry[:].y
        self['longitude'] = self.geometry[:].x

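    # Example (illustrative sketch): set_geometry_points() and set_lat_lon()
    # keep the point geometry and the latitude/longitude columns consistent,
    # as required by check().
    #
    #     exp.set_geometry_points()  # build shapely Points from lat/lon
    #     exp.set_lat_lon()          # recover lat/lon columns from geometry
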
    def set_from_raster(self, file_name, band=1, src_crs=None, window=False,
                        geometry=False, dst_crs=False, transform=None,
                        width=None, height=None,
                        resampling=Resampling.nearest):
        """Read raster data and set latitude, longitude, value and meta

        Parameters:
            file_name (str): file name containing values
            band (int, optional): bands to read (starting at 1)
            src_crs (crs, optional): source CRS. Provide it if error without it.
            window (rasterio.windows.Window, optional): window where data is
                extracted
            geometry (shapely.geometry, optional): consider pixels only in shape
            dst_crs (crs, optional): reproject to given crs
            transform (rasterio.Affine): affine transformation to apply
            width (float): number of lons for transform
            height (float): number of lats for transform
            resampling (rasterio.warp.Resampling, optional): resampling
                function used for reprojection to dst_crs
        """
        self.__init__()
        self.tag = Tag()
        self.tag.file_name = file_name
        meta, value = co.read_raster(file_name, [band], src_crs, window,
                                     geometry, dst_crs, transform, width,
                                     height, resampling)
        # build the grid of pixel centers from the affine transform
        ulx, xres, _, uly, _, yres = meta['transform'].to_gdal()
        lrx = ulx + meta['width'] * xres
        lry = uly + meta['height'] * yres
        x_grid, y_grid = np.meshgrid(np.arange(ulx + xres / 2, lrx, xres),
                                     np.arange(uly + yres / 2, lry, yres))
        try:
            self.crs = meta['crs'].to_dict()
        except AttributeError:
            self.crs = meta['crs']
        self['longitude'] = x_grid.flatten()
        self['latitude'] = y_grid.flatten()
        self['value'] = value.reshape(-1)
        self.meta = meta

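    # Example (illustrative sketch; 'data.tif' is a hypothetical file): every
    # pixel center of the raster becomes one exposure point and the raster
    # properties are stored in the meta attribute.
    #
    #     exp = Exposures()
    #     exp.set_from_raster('data.tif', band=1)
    #     exp.meta['transform']  # affine transform of the source raster
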
    def plot_scatter(self, mask=None, ignore_zero=False, pop_name=True,
                     buffer=0.0, extend='neither', axis=None, **kwargs):
        """Plot exposures geometry's value sum scattered over Earth's map.
        The plot will be projected according to the current crs.

        Parameters:
            mask (np.array, optional): mask to apply to eai_exp plotted.
            ignore_zero (bool, optional): flag to indicate if zero and negative
                values are ignored in plot. Default: False
            pop_name (bool, optional): add names of the populated places
            buffer (float, optional): border to add to coordinates.
                Default: 0.0.
            extend (str, optional): extend border colorbar with arrows.
                [ 'neither' | 'both' | 'min' | 'max' ]
            axis (matplotlib.axes._subplots.AxesSubplot, optional): axis to use
            kwargs (optional): arguments for scatter matplotlib function, e.g.
                cmap='Greys'. Default: 'Wistia'

        Returns:
            cartopy.mpl.geoaxes.GeoAxesSubplot
        """
        crs_epsg, _ = u_plot.get_transformation(self.crs)
        title = self.tag.description
        cbar_label = 'Value (%s)' % self.value_unit
        if mask is None:
            mask = np.ones((self.shape[0],), dtype=bool)
        if ignore_zero:
            pos_vals = self.value[mask].values > 0
        else:
            pos_vals = np.ones((self.value[mask].values.size,), dtype=bool)
        value = self.value[mask][pos_vals].values
        coord = np.stack([self.latitude[mask][pos_vals].values,
                          self.longitude[mask][pos_vals].values], axis=1)
        return u_plot.geo_scatter_from_array(value, coord, cbar_label, title,
                                             pop_name, buffer, extend,
                                             proj=crs_epsg, axes=axis,
                                             **kwargs)

    def plot_hexbin(self, mask=None, ignore_zero=False, pop_name=True,
                    buffer=0.0, extend='neither', axis=None, **kwargs):
        """Plot exposures geometry's value sum binned over Earth's map.
        Another function for the bins can be set through the key
        reduce_C_function. The plot will be projected according to the current
        crs.

        Parameters:
            mask (np.array, optional): mask to apply to eai_exp plotted.
            ignore_zero (bool, optional): flag to indicate if zero and negative
                values are ignored in plot. Default: False
            pop_name (bool, optional): add names of the populated places
            buffer (float, optional): border to add to coordinates.
                Default: 0.0.
            extend (str, optional): extend border colorbar with arrows.
                [ 'neither' | 'both' | 'min' | 'max' ]
            axis (matplotlib.axes._subplots.AxesSubplot, optional): axis to use
            kwargs (optional): arguments for hexbin matplotlib function, e.g.
                reduce_C_function=np.average.
                Default: reduce_C_function=np.sum

        Returns:
            cartopy.mpl.geoaxes.GeoAxesSubplot
        """
        crs_epsg, _ = u_plot.get_transformation(self.crs)
        title = self.tag.description
        cbar_label = 'Value (%s)' % self.value_unit
        if 'reduce_C_function' not in kwargs:
            kwargs['reduce_C_function'] = np.sum
        if mask is None:
            mask = np.ones((self.shape[0],), dtype=bool)
        if ignore_zero:
            pos_vals = self.value[mask].values > 0
        else:
            pos_vals = np.ones((self.value[mask].values.size,), dtype=bool)
        value = self.value[mask][pos_vals].values
        coord = np.stack([self.latitude[mask][pos_vals].values,
                          self.longitude[mask][pos_vals].values], axis=1)
        return u_plot.geo_bin_from_array(value, coord, cbar_label, title,
                                         pop_name, buffer, extend,
                                         proj=crs_epsg, axes=axis, **kwargs)

    def plot_raster(self, res=None, raster_res=None, save_tiff=None,
                    raster_f=lambda x: np.log10((np.fmax(x + 1, 1))),
                    label='value (log10)', scheduler=None, axis=None,
                    **kwargs):
        """Generate raster from points geometry and plot it using log10 scale:
        np.log10((np.fmax(raster+1, 1))).

        Parameters:
            res (float, optional): resolution of current data in units of
                latitude and longitude, approximated if not provided.
            raster_res (float, optional): desired resolution of the raster
            save_tiff (str, optional): file name to save the raster in tiff
                format, if provided
            raster_f (lambda function): transformation to use to data.
                Default: log10 adding 1.
            label (str): colorbar label
            scheduler (str): used for dask map_partitions. "threads",
                "synchronous" or "processes"
            axis (matplotlib.axes._subplots.AxesSubplot, optional): axis to use
            kwargs (optional): arguments for imshow matplotlib function

        Returns:
            matplotlib.figure.Figure, cartopy.mpl.geoaxes.GeoAxesSubplot
        """
        if self.meta and self.meta['height'] * self.meta['width'] == len(self):
            raster = self.value.values.reshape((self.meta['height'],
                                                self.meta['width']))
            # check raster starts by upper left corner
            if self.latitude.values[0] < self.latitude.values[-1]:
                raster = np.flip(raster, axis=0)
            if self.longitude.values[0] > self.longitude.values[-1]:
                LOGGER.error('Points are not ordered according to meta raster.')
                raise ValueError
            meta = self.meta  # needed below when saving the tiff
        else:
            raster, meta = co.points_to_raster(self, ['value'], res,
                                               raster_res, scheduler)
            raster = raster.reshape((meta['height'], meta['width']))
        # save tiff
        if save_tiff is not None:
            ras_tiff = rasterio.open(save_tiff, 'w', driver='GTiff',
                                     height=meta['height'],
                                     width=meta['width'], count=1,
                                     dtype=np.float32, crs=self.crs,
                                     transform=meta['transform'])
            ras_tiff.write(raster.astype(np.float32), 1)
            ras_tiff.close()
        # make plot
        crs_epsg, _ = u_plot.get_transformation(self.crs)
        xmin, ymin, xmax, ymax = (self.longitude.min(), self.latitude.min(),
                                  self.longitude.max(), self.latitude.max())
        if not axis:
            _, axis = u_plot.make_map(proj=crs_epsg)
        cbar_ax = make_axes_locatable(axis).append_axes('right', size="6.5%",
                                                        pad=0.1,
                                                        axes_class=plt.Axes)
        axis.set_extent([max(xmin, crs_epsg.x_limits[0]),
                         min(xmax, crs_epsg.x_limits[1]),
                         max(ymin, crs_epsg.y_limits[0]),
                         min(ymax, crs_epsg.y_limits[1])], crs_epsg)
        u_plot.add_shapes(axis)
        imag = axis.imshow(raster_f(raster), **kwargs, origin='upper',
                           extent=[xmin, xmax, ymin, ymax], transform=crs_epsg)
        plt.colorbar(imag, cax=cbar_ax, label=label)
        plt.draw()
        return axis

    def plot_basemap(self, mask=None, ignore_zero=False, pop_name=True,
                     buffer=0.0, extend='neither', zoom=10,
                     url='http://tile.stamen.com/terrain/tileZ/tileX/tileY.png',
                     axis=None, **kwargs):
        """Scatter points over satellite image using contextily

        Parameters:
            mask (np.array, optional): mask to apply to eai_exp plotted. Same
                size of the exposures, only the selected indexes will be
                plotted.
            ignore_zero (bool, optional): flag to indicate if zero and negative
                values are ignored in plot. Default: False
            pop_name (bool, optional): add names of the populated places
            buffer (float, optional): border to add to coordinates.
                Default: 0.0.
            extend (str, optional): extend border colorbar with arrows.
                [ 'neither' | 'both' | 'min' | 'max' ]
            zoom (int, optional): zoom coefficient used in the satellite image
            url (str, optional): image source, e.g. ctx.sources.OSM_C
            axis (matplotlib.axes._subplots.AxesSubplot, optional): axis to use
            kwargs (optional): arguments for scatter matplotlib function, e.g.
                cmap='Greys'. Default: 'Wistia'

        Returns:
            matplotlib.figure.Figure, cartopy.mpl.geoaxes.GeoAxesSubplot
        """
        if 'geometry' not in self.columns:
            self.set_geometry_points()
        crs_ori = self.crs
        self.to_crs(epsg=3857, inplace=True)
        axis = self.plot_scatter(mask, ignore_zero, pop_name, buffer, extend,
                                 shapes=False, axis=axis, **kwargs)
        ctx.add_basemap(axis, zoom, url, origin='upper')
        axis.set_axis_off()
        self.to_crs(crs_ori, inplace=True)
        return axis

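    # Example (illustrative sketch): the exposures are reprojected to web
    # mercator (EPSG:3857) only for the duration of the plot; the original
    # CRS is restored before returning.
    #
    #     exp.plot_basemap(zoom=8, url=ctx.sources.OSM_C, cmap='Greys')
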
    def write_hdf5(self, file_name):
        """Write data frame and metadata in hdf5 format

        Parameters:
            file_name (str): name of the target file
        """
        LOGGER.info('Writing %s', file_name)
        store = pd.HDFStore(file_name)
        store.put('exposures', pd.DataFrame(self))
        var_meta = {}
        for var in self._metadata:
            var_meta[var] = getattr(self, var)
        store.get_storer('exposures').attrs.metadata = var_meta
        store.close()

    def read_hdf5(self, file_name):
        """Read data frame and metadata in hdf5 format

        Parameters:
            file_name (str): name of the source file
        """
        LOGGER.info('Reading %s', file_name)
        with pd.HDFStore(file_name) as store:
            self.__init__(store['exposures'])
            metadata = store.get_storer('exposures').attrs.metadata
            for key, val in metadata.items():
                setattr(self, key, val)

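    # Example (illustrative sketch; 'exp.h5' is a hypothetical path): the hdf5
    # round trip preserves both the data frame and the metadata attributes.
    #
    #     exp.write_hdf5('exp.h5')
    #     exp2 = Exposures()
    #     exp2.read_hdf5('exp.h5')
    #     exp2.ref_year == exp.ref_year  # True
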
    def read_mat(self, file_name, var_names=DEF_VAR_MAT):
        """Read MATLAB file and store variables in exposures.

        Parameters:
            file_name (str): absolute path file
            var_names (dict, optional): dictionary containing the name of the
                MATLAB variables. Default: DEF_VAR_MAT.
        """
        LOGGER.info('Reading %s', file_name)
        if var_names is None:
            var_names = DEF_VAR_MAT

        data = hdf5.read(file_name)
        try:
            data = data[var_names['sup_field_name']]
        except KeyError:
            pass

        try:
            data = data[var_names['field_name']]
            exposures = dict()
            _read_mat_obligatory(exposures, data, var_names)
            _read_mat_optional(exposures, data, var_names)
        except KeyError as var_err:
            LOGGER.error("Variable not found in MATLAB file: %s", str(var_err))
            raise var_err

        Exposures.__init__(self, data=exposures)
        _read_mat_metadata(self, data, file_name, var_names)

    #
    # Implement geopandas methods
    #

    def to_crs(self, crs=None, epsg=None, inplace=False):
        res = super(Exposures, self).to_crs(crs, epsg, inplace)
        if res is not None:
            res.set_lat_lon()
            return res
        self.set_lat_lon()
        return None

    to_crs.__doc__ = GeoDataFrame.to_crs.__doc__

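    # Example (illustrative sketch): unlike the inherited GeoDataFrame method,
    # this override also refreshes the latitude and longitude columns after
    # reprojecting.
    #
    #     exp_merc = exp.to_crs(epsg=3857)     # reprojected copy
    #     exp.to_crs(epsg=3857, inplace=True)  # or reproject in place
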
    def copy(self, deep=True):
        """Make a copy of this Exposures object.

        Parameters
        ----------
        deep (bool): Make a deep copy, i.e. also copy data. Default True.

        Returns
        -------
        Exposures
        """
        # FIXME: this will likely be unnecessary if removed from GeoDataFrame
        data = self._data
        if deep:
            data = data.copy()
        return Exposures(data).__finalize__(self)

    def write_raster(self, file_name, value_name='value', scheduler=None):
        """Write value data into raster file with GeoTiff format

        Parameters:
            file_name (str): name output file in tif format
            value_name (str, optional): name of the column with the values to
                write. Default: 'value'
            scheduler (str, optional): used for dask map_partitions. "threads",
                "synchronous" or "processes"
        """
        if self.meta and self.meta['height'] * self.meta['width'] == len(self):
            raster = self[value_name].values.reshape((self.meta['height'],
                                                      self.meta['width']))
            # check raster starts by upper left corner
            if self.latitude.values[0] < self.latitude.values[-1]:
                raster = np.flip(raster, axis=0)
            if self.longitude.values[0] > self.longitude.values[-1]:
                LOGGER.error('Points are not ordered according to meta raster.')
                raise ValueError
            co.write_raster(file_name, raster, self.meta)
        else:
            raster, meta = co.points_to_raster(self, [value_name],
                                               scheduler=scheduler)
            co.write_raster(file_name, raster, meta)

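    # Example (illustrative sketch; 'exp.tif' is a hypothetical path): writes
    # the value column as GeoTiff, rasterizing the points first when no raster
    # meta is stored.
    #
    #     exp.write_raster('exp.tif')
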
def add_sea(exposures, sea_res):
    """Add sea to geometry's surroundings with given resolution. region_id
    set to -1 and other variables to 0.

    Parameters:
        exposures (Exposures): exposures to surround with sea points
        sea_res (tuple): (sea_coast_km, sea_res_km), where first parameter
            is distance from coast to fill with water and second parameter
            is resolution between sea points

    Returns:
        Exposures
    """
    LOGGER.info("Adding sea at %s km resolution and %s km distance from "
                "coast.", str(sea_res[1]), str(sea_res[0]))

    sea_res = (sea_res[0] / ONE_LAT_KM, sea_res[1] / ONE_LAT_KM)

    min_lat = max(-90, float(exposures.latitude.min()) - sea_res[0])
    max_lat = min(90, float(exposures.latitude.max()) + sea_res[0])
    min_lon = max(-180, float(exposures.longitude.min()) - sea_res[0])
    max_lon = min(180, float(exposures.longitude.max()) + sea_res[0])

    lat_arr = np.arange(min_lat, max_lat + sea_res[1], sea_res[1])
    lon_arr = np.arange(min_lon, max_lon + sea_res[1], sea_res[1])

    lon_mgrid, lat_mgrid = np.meshgrid(lon_arr, lat_arr)
    lon_mgrid, lat_mgrid = lon_mgrid.ravel(), lat_mgrid.ravel()
    on_sea = np.logical_not(co.coord_on_land(lat_mgrid, lon_mgrid))

    sea_exp = Exposures()
    sea_exp['latitude'] = lat_mgrid[on_sea]
    sea_exp['longitude'] = lon_mgrid[on_sea]
    sea_exp['region_id'] = np.zeros(sea_exp.latitude.size, int) - 1

    if 'geometry' in exposures.columns:
        sea_exp.set_geometry_points()

    for var_name in exposures.columns:
        if var_name not in ('latitude', 'longitude', 'region_id', 'geometry'):
            sea_exp[var_name] = np.zeros(sea_exp.latitude.size,
                                         exposures[var_name].dtype)

    return pd.concat([exposures, sea_exp], ignore_index=True, sort=False)

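# Example (illustrative sketch): surround an exposures set with sea points up
# to 50 km from the coast at 10 km resolution; sea points get region_id -1 and
# all other variables 0.
#
#     exp_sea = add_sea(exp, (50, 10))
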
def _read_mat_obligatory(exposures, data, var_names):
    """Fill obligatory variables."""
    exposures['value'] = np.squeeze(data[var_names['var_name']['val']])
    exposures['latitude'] = data[var_names['var_name']['lat']].reshape(-1)
    exposures['longitude'] = data[var_names['var_name']['lon']].reshape(-1)
    exposures[INDICATOR_IF] = np.squeeze(
        data[var_names['var_name']['imp']]).astype(int, copy=False)


def _read_mat_optional(exposures, data, var_names):
    """Fill optional parameters."""
    try:
        exposures['deductible'] = np.squeeze(data[var_names['var_name']['ded']])
    except KeyError:
        pass
    try:
        exposures['cover'] = np.squeeze(data[var_names['var_name']['cov']])
    except KeyError:
        pass
    try:
        exposures['category_id'] = \
            np.squeeze(data[var_names['var_name']['cat']]).astype(int,
                                                                  copy=False)
    except KeyError:
        pass
    try:
        exposures['region_id'] = \
            np.squeeze(data[var_names['var_name']['reg']]).astype(int,
                                                                  copy=False)
    except KeyError:
        pass
    try:
        assigned = np.squeeze(data[var_names['var_name']['ass']]).astype(
            int, copy=False)
        if assigned.size > 0:
            exposures[INDICATOR_CENTR] = assigned
    except KeyError:
        pass


def _read_mat_metadata(exposures, data, file_name, var_names):
    """Fill metadata in DataFrame object"""
    try:
        exposures.ref_year = int(np.squeeze(data[var_names['var_name']['ref']]))
    except KeyError:
        exposures.ref_year = DEF_REF_YEAR
    try:
        exposures.value_unit = hdf5.get_str_from_ref(
            file_name, data[var_names['var_name']['uni']][0][0])
    except KeyError:
        exposures.value_unit = DEF_VALUE_UNIT
    exposures.tag = Tag(file_name)