# Copyright 2021 Tomoki Hayashi
# Apache 2.0 (http://www.apache.org/licenses/LICENSE-2.0)
"""Text-to-speech abstrast class."""
from abc import ABC, abstractmethod
from typing import Dict, Tuple
import torch
[docs]class AbsTTS(torch.nn.Module, ABC):
"""TTS abstract class."""
[docs] @abstractmethod
def forward(
self,
text: torch.Tensor,
text_lengths: torch.Tensor,
feats: torch.Tensor,
feats_lengths: torch.Tensor,
**kwargs,
) -> Tuple[torch.Tensor, Dict[str, torch.Tensor], torch.Tensor]:
"""Calculate outputs and return the loss tensor."""
raise NotImplementedError
[docs] @abstractmethod
def inference(
self,
text: torch.Tensor,
**kwargs,
) -> Dict[str, torch.Tensor]:
"""Return predicted output as a dict."""
raise NotImplementedError
@property
def require_raw_speech(self):
"""Return whether or not raw_speech is required."""
return False
@property
def require_vocoder(self):
"""Return whether or not vocoder is required."""
return True