# coding: utf-8
# Licensed under a 3-clause BSD style license - see LICENSE.rst

import numpy as np
from numpy.testing import assert_array_equal
import pytest

from astropy import units as u
from astropy.table import QTable, hstack, vstack, join

from astropy.utils.masked import Masked
from astropy.utils.compat.optional_deps import HAS_H5PY

from .test_masked import assert_masked_equal


FILE_FORMATS = ['ecsv', 'fits']
if HAS_H5PY:
    FILE_FORMATS.append('h5')


class MaskedArrayTableSetup:
    @classmethod
    def setup_arrays(self):
        self.a = np.array([3., 5., 0.])
        self.mask_a = np.array([True, False, False])

    @classmethod
    def setup_class(self):
        self.setup_arrays()
        self.ma = Masked(self.a, mask=self.mask_a)
        self.ma.info.format = '.1f'
        self.t = QTable([self.ma], names=['ma'])


class MaskedQuantityTableSetup(MaskedArrayTableSetup):
    @classmethod
    def setup_arrays(self):
        self.a = np.array([3., 5., 0.]) << u.m
        self.mask_a = np.array([True, False, False])


class TestMaskedArrayTable(MaskedArrayTableSetup):
    def test_table_initialization(self):
        assert_array_equal(self.t['ma'].unmasked, self.a)
        assert_array_equal(self.t['ma'].mask, self.mask_a)
        assert repr(self.t).splitlines()[-3:] == [
            '    ———',
            '    5.0',
            '    0.0']

    def test_info_basics(self):
        assert self.t['ma'].info.name == 'ma'
        assert 'serialize_method' in self.t['ma'].info.attr_names
        t2 = self.t.copy()
        t2['ma'].info.format = '.2f'
        t2['ma'].info.serialize_method['fits'] = 'nonsense'
        assert repr(t2).splitlines()[-3:] == [
            '    ———',
            '   5.00',
            '   0.00']
        # Check that if we slice, things get copied over correctly.
        t3 = t2[:2]
        assert t3['ma'].info.name == 'ma'
        assert t3['ma'].info.format == '.2f'
        assert 'serialize_method' in t3['ma'].info.attr_names
        assert t3['ma'].info.serialize_method['fits'] == 'nonsense'

    @pytest.mark.parametrize('file_format', FILE_FORMATS)
    def test_table_write(self, file_format, tmpdir):
        name = str(tmpdir.join(f"a.{file_format}"))
        kwargs = {}
        if file_format == 'h5':
            kwargs['path'] = 'trial'
            kwargs['serialize_meta'] = True

        self.t.write(name, **kwargs)
        t2 = QTable.read(name)
        assert isinstance(t2['ma'], self.ma.__class__)
        assert np.all(t2['ma'] == self.ma)
        assert np.all(t2['ma'].mask == self.mask_a)
        if file_format == 'fits':
            # Imperfect roundtrip through FITS native format description.
            assert self.t['ma'].info.format in t2['ma'].info.format
        else:
            assert t2['ma'].info.format == self.t['ma'].info.format

    @pytest.mark.parametrize('serialize_method', ['data_mask', 'null_value'])
    def test_table_write_serialization(self, serialize_method, tmpdir):
        name = str(tmpdir.join("test.ecsv"))
        self.t.write(name, serialize_method=serialize_method)
        with open(name) as fh:
            lines = fh.readlines()

        t2 = QTable.read(name)
        assert isinstance(t2['ma'], self.ma.__class__)

        if serialize_method == 'data_mask':
            # Will data_mask, we have data and mask columns and should
            # exactly round-trip.
            assert len(lines[-1].split()) == 2
            assert_masked_equal(t2['ma'], self.ma)
        else:
            # With null_value we have just a data column with null values
            # marked, so we lost information on the data below the mask.
            assert len(lines[-1].split()) == 1
            assert np.all(t2['ma'] == self.ma)
            assert np.all(t2['ma'].mask == self.mask_a)

    def test_non_existing_serialize_method(self, tmpdir):
        name = str(tmpdir.join('bad.ecsv'))
        with pytest.raises(ValueError, match='serialize method must be'):
            self.t.write(name, serialize_method='bad_serialize_method')


class TestMaskedQuantityTable(TestMaskedArrayTable, MaskedQuantityTableSetup):
    # Runs tests from TestMaskedArrayTable as well as some extra ones.
    def test_table_operations_requiring_masking(self):
        t1 = self.t
        t2 = QTable({'ma2': Masked([1, 2] * u.m)})
        t12 = hstack([t1, t2], join_type='outer')
        assert np.all(t12['ma'].mask == [True, False, False])
        # 'ma2' is shorter by one so we expect one True from hstack so length matches
        assert np.all(t12['ma2'].mask == [False, False, True])

        t12 = hstack([t1, t2], join_type='inner')
        assert np.all(t12['ma'].mask == [True, False])
        assert np.all(t12['ma2'].mask == [False, False])

        # Vstack tables with different column names. In this case we get masked
        # values
        t12 = vstack([t1, t2], join_type='outer')
        #  ma ma2
        #  m   m
        # --- ---
        #  ——  ——
        # 5.0  ——
        # 0.0  ——
        #  —— 1.0
        #  —— 2.0
        assert np.all(t12['ma'].mask == [True, False, False, True, True])
        assert np.all(t12['ma2'].mask == [True, True, True, False, False])

    def test_table_operations_requiring_masking_auto_promote(self):
        MaskedQuantity = Masked(u.Quantity)
        t1 = QTable({'ma1': [1, 2] * u.m})
        t2 = QTable({'ma2': [3, 4, 5] * u.m})
        t12 = hstack([t1, t2], join_type='outer')
        assert isinstance(t12['ma1'], MaskedQuantity)
        assert np.all(t12['ma1'].mask == [False, False, True])
        assert np.all(t12['ma1'] == [1, 2, 0] * u.m)
        assert not isinstance(t12['ma2'], MaskedQuantity)
        assert isinstance(t12['ma2'], u.Quantity)
        assert np.all(t12['ma2'] == [3, 4, 5] * u.m)

        t12 = hstack([t1, t2], join_type='inner')
        assert isinstance(t12['ma1'], u.Quantity)
        assert not isinstance(t12['ma1'], MaskedQuantity)
        assert isinstance(t12['ma2'], u.Quantity)
        assert not isinstance(t12['ma2'], MaskedQuantity)

        # Vstack tables with different column names. In this case we get masked
        # values
        t12 = vstack([t1, t2], join_type='outer')
        assert np.all(t12['ma1'].mask == [False, False, True, True, True])
        assert np.all(t12['ma2'].mask == [True, True, False, False, False])

        t1['a'] = [1, 2]
        t2['a'] = [1, 3, 4]
        t12 = join(t1, t2, join_type='outer')
        assert np.all(t12['ma1'].mask == [False, False, True, True])
        assert np.all(t12['ma2'].mask == [False, True, False, False])