Source code for diffsptk.modules.dct

# ------------------------------------------------------------------------ #
# Copyright 2022 SPTK Working Group                                        #
#                                                                          #
# Licensed under the Apache License, Version 2.0 (the "License");          #
# you may not use this file except in compliance with the License.         #
# You may obtain a copy of the License at                                  #
#                                                                          #
#     http://www.apache.org/licenses/LICENSE-2.0                           #
#                                                                          #
# Unless required by applicable law or agreed to in writing, software      #
# distributed under the License is distributed on an "AS IS" BASIS,        #
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. #
# See the License for the specific language governing permissions and      #
# limitations under the License.                                           #
# ------------------------------------------------------------------------ #

import torch
from torch import nn

from ..misc.utils import check_size
from ..misc.utils import plateau
from ..misc.utils import to



[docs]
class DiscreteCosineTransform(nn.Module):
    """See `this page <https://sp-nitech.github.io/sptk/latest/main/dct.html>`_
    for details.

    Parameters
    ----------
    dct_length : int >= 1
        DCT length, :math:`L`.

    dct_type : int in [1, 4]
        DCT type.

    """

    def __init__(self, dct_length, dct_type=2):
        super().__init__()

        assert 1 <= dct_length
        assert 1 <= dct_type <= 4

        self.dct_length = dct_length
        self.register_buffer("W", self._precompute(dct_length, dct_type))


[docs]
    def forward(self, x):
        """Apply DCT to input.

        Parameters
        ----------
        x : Tensor [shape=(..., L)]
            Input.

        Returns
        -------
        out : Tensor [shape=(..., L)]
            DCT output.

        Examples
        --------
        >>> x = diffsptk.ramp(3)
        >>> dct = diffsptk.DCT(4)
        >>> y = dct(x)
        >>> y
        tensor([ 3.0000, -2.2304,  0.0000, -0.1585])

        """
        check_size(x.size(-1), self.dct_length, "dimension of input")
        return self._forward(x, self.W)


    @staticmethod
    def _forward(x, W):
        return torch.matmul(x, W)

    @staticmethod
    def _func(x, dct_type):
        W = DiscreteCosineTransform._precompute(
            x.size(-1), dct_type, dtype=x.dtype, device=x.device
        )
        return DiscreteCosineTransform._forward(x, W)

    @staticmethod
    def _precompute(length, dct_type, dtype=None, device=None):
        L = length
        n = torch.arange(L, dtype=torch.double, device=device)
        k = torch.arange(L, dtype=torch.double, device=device)
        if dct_type == 2 or dct_type == 4:
            n += 0.5
        if dct_type == 3 or dct_type == 4:
            k += 0.5
        n *= torch.pi / ((L - 1) if dct_type == 1 else L)

        if dct_type == 1:
            c = (1 / 2) ** 0.5
            z0 = plateau(L, c, 1, c, dtype=torch.double, device=device)
            z1 = plateau(L, 1, 2, 1, dtype=torch.double, device=device)
            z = z0.unsqueeze(0) * torch.sqrt(z1 / (L - 1)).unsqueeze(1)
        elif dct_type == 2:
            z = plateau(L, 1, 2, dtype=torch.double, device=device)
            z = torch.sqrt(z / L).unsqueeze(0)
        elif dct_type == 3:
            z = plateau(L, 1, 2, dtype=torch.double, device=device)
            z = torch.sqrt(z / L).unsqueeze(1)
        elif dct_type == 4:
            z = (2 / L) ** 0.5
        else:
            raise ValueError
        W = z * torch.cos(k.unsqueeze(0) * n.unsqueeze(1))
        return to(W, dtype=dtype)