# Source code for diffsptk.modules.lpc2lsp

# ------------------------------------------------------------------------ #
# Copyright 2022 SPTK Working Group                                        #
#                                                                          #
# Licensed under the Apache License, Version 2.0 (the "License");          #
# you may not use this file except in compliance with the License.         #
# You may obtain a copy of the License at                                  #
#                                                                          #
#     http://www.apache.org/licenses/LICENSE-2.0                           #
#                                                                          #
# Unless required by applicable law or agreed to in writing, software      #
# distributed under the License is distributed on an "AS IS" BASIS,        #
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. #
# See the License for the specific language governing permissions and      #
# limitations under the License.                                           #
# ------------------------------------------------------------------------ #

import torch
from torch import nn
import torch.nn.functional as F

from ..misc.utils import TWO_PI
from ..misc.utils import check_size
from ..misc.utils import deconv1d
from .root_pol import PolynomialToRoots



# [docs]
class LinearPredictiveCoefficientsToLineSpectralPairs(nn.Module):
    """See `this page <https://sp-nitech.github.io/sptk/latest/main/lpc2lsp.html>`_
    for details.

    Parameters
    ----------
    lpc_order : int >= 0
        Order of LPC, :math:`M`.

    log_gain : bool
        If True, output gain in log scale.

    sample_rate : int >= 1 or None
        Sample rate in Hz. Required when ``out_format`` is 'khz' or 'hz'.

    out_format : ['radian', 'cycle', 'khz', 'hz']
        Output format. The integers 0, 1, 2, and 3 are accepted as aliases
        of 'radian', 'cycle', 'khz', and 'hz', respectively.

    """

    def __init__(
        self, lpc_order, log_gain=False, sample_rate=None, out_format="radian"
    ):
        super().__init__()

        assert 0 <= lpc_order

        self.lpc_order = lpc_order
        self.log_gain = log_gain
        self.formatter = self._formatter(out_format, sample_rate)

        # The kernels are registered as buffers so that they follow the module
        # across ``.to()`` / ``.double()`` / ``.cuda()`` calls.
        kernel_p, kernel_q = self._precompute(self.lpc_order)
        self.register_buffer("kernel_p", kernel_p)
        self.register_buffer("kernel_q", kernel_q)

    def forward(self, a):
        """Convert LPC to LSP.

        Parameters
        ----------
        a : Tensor [shape=(..., M+1)]
            LPC coefficients.

        Returns
        -------
        out : Tensor [shape=(..., M+1)]
            LSP frequencies.

        Examples
        --------
        >>> x = diffsptk.nrand(4)
        >>> x
        tensor([-1.5326,  1.0875, -1.5925,  0.6913,  1.6217])
        >>> lpc = diffsptk.LPC(3, 5)
        >>> a = lpc(x)
        >>> a
        tensor([ 2.7969,  0.3908,  0.0458, -0.0859])
        >>> lpc2lsp = diffsptk.LinearPredictiveCoefficientsToLineSpectralPairs(3)
        >>> w = lpc2lsp(a)
        >>> w
        tensor([2.7969, 0.9037, 1.8114, 2.4514])

        """
        check_size(a.size(-1), self.lpc_order + 1, "dimension of LPC")
        return self._forward(
            a, self.log_gain, self.formatter, self.kernel_p, self.kernel_q
        )

    @staticmethod
    def _forward(a, log_gain, formatter, kernel_p, kernel_q):
        """Stateless implementation of the LPC-to-LSP conversion.

        Parameters
        ----------
        a : Tensor [shape=(..., M+1)]
            Gain followed by the M predictor coefficients.

        log_gain : bool
            If True, the gain is passed through ``torch.log``.

        formatter : callable
            Function applied to the frequencies (in radians) before they are
            concatenated with the gain.

        kernel_p : Tensor
            Kernel passed to ``deconv1d`` for the difference polynomial.

        kernel_q : Tensor
            Kernel passed to ``deconv1d`` for the sum polynomial.

        Returns
        -------
        out : Tensor [shape=(..., M+1)]
            Gain followed by the M formatted frequencies.

        """
        M = a.size(-1) - 1
        # Separate the gain (first element) from the predictor coefficients.
        K, a = torch.split(a, [1, M], dim=-1)

        if log_gain:
            K = torch.log(K)
        if M == 0:
            # Only the gain exists; there are no frequencies to compute.
            return K

        # a1 = [1, a(1), ..., a(M), 0] and a2 is its reversal, so p is the
        # antisymmetric and q the symmetric combination of the two.
        a0 = F.pad(a, (1, 0), value=1)
        a1 = F.pad(a0, (0, 1), value=0)
        a2 = a1.flip(-1)
        p = a1 - a2
        q = a1 + a2
        if M == 1:
            # A single frequency is read from the first root of q alone.
            q = PolynomialToRoots._func(q)
            w = torch.angle(q[..., 0])
        else:
            # NOTE(review): deconv1d presumably divides out the trivial
            # factors encoded by the kernels -- confirm against its definition.
            p = deconv1d(p, kernel_p)
            q = deconv1d(q, kernel_q)
            p = PolynomialToRoots._func(p)
            q = PolynomialToRoots._func(q)
            # Keep every other root; this presumably relies on the root finder
            # returning conjugate pairs adjacently -- TODO confirm.
            p = torch.angle(p[..., 0::2])
            q = torch.angle(q[..., 0::2])
            w, _ = torch.sort(torch.cat((p, q), dim=-1))

        w = w.view_as(a)
        w = formatter(w)
        w = torch.cat((K, w), dim=-1)
        return w

    @staticmethod
    def _func(a, log_gain, sample_rate, out_format):
        """Functional entry point that builds the formatter and kernels on the fly.

        The kernels are created with the dtype and device of ``a`` so that no
        module instance (and hence no registered buffer) is required.

        """
        formatter = LinearPredictiveCoefficientsToLineSpectralPairs._formatter(
            out_format, sample_rate
        )
        kernels = LinearPredictiveCoefficientsToLineSpectralPairs._precompute(
            a.size(-1) - 1, dtype=a.dtype, device=a.device
        )
        return LinearPredictiveCoefficientsToLineSpectralPairs._forward(
            a, log_gain, formatter, *kernels
        )

    @staticmethod
    def _precompute(lpc_order, dtype=None, device=None):
        """Create the two kernels used by ``_forward``.

        Parameters
        ----------
        lpc_order : int >= 0
            Order of LPC, :math:`M`. Only its parity affects the result.

        dtype : torch.dtype or None
            Data type of the kernels. If None, the default dtype is used.

        device : torch.device or None
            Device of the kernels.

        Returns
        -------
        kernel_p : Tensor
            ``[1, -1]`` for even orders, ``[1, 0, -1]`` for odd orders.

        kernel_q : Tensor
            ``[1, 1]`` for even orders, ``[1]`` for odd orders.

        """
        # dtype is forwarded so the kernels match the input tensor when called
        # from _func; previously it was accepted but silently ignored.
        if lpc_order % 2 == 0:
            kernel_p = torch.tensor([1.0, -1.0], dtype=dtype, device=device)
            kernel_q = torch.tensor([1.0, 1.0], dtype=dtype, device=device)
        else:
            kernel_p = torch.tensor([1.0, 0.0, -1.0], dtype=dtype, device=device)
            kernel_q = torch.tensor([1.0], dtype=dtype, device=device)
        return kernel_p, kernel_q

    @staticmethod
    def _formatter(out_format, sample_rate):
        """Return a function converting frequencies in radians to ``out_format``.

        Parameters
        ----------
        out_format : ['radian', 'cycle', 'khz', 'hz'] or [0, 1, 2, 3]
            Output format.

        sample_rate : int >= 1 or None
            Sample rate in Hz; asserted to be positive for 'khz' and 'hz'.

        Returns
        -------
        out : callable
            Function mapping a value in radians to the requested unit.

        Raises
        ------
        ValueError
            If ``out_format`` is not one of the supported values.

        """
        if out_format in (0, "radian"):
            return lambda x: x
        elif out_format in (1, "cycle"):
            return lambda x: x / TWO_PI
        elif out_format in (2, "khz"):
            assert sample_rate is not None and 0 < sample_rate
            return lambda x: x * (sample_rate / 1000 / TWO_PI)
        elif out_format in (3, "hz"):
            assert sample_rate is not None and 0 < sample_rate
            return lambda x: x * (sample_rate / TWO_PI)
        raise ValueError(f"out_format {out_format} is not supported.")