OpenVoiceOS
diff --git a/‎mycroft/tts/__init__.py‎
Lines changed: 7 additions & 19 deletions b/‎mycroft/tts/__init__.py‎
Lines changed: 7 additions & 19 deletions
diff --git a/‎mycroft/tts/cache.py‎
Lines changed: 8 additions & 338 deletions b/‎mycroft/tts/cache.py‎
Lines changed: 8 additions & 338 deletions
@@ -1,20 +1,8 @@
-# Copyright 2017 Mycroft AI Inc.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#    http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-#
-"""The TTS module contains TTS classes for interfacing with various TTS
-services. This includes both local and remote services. The module also
-declares a "factory" for spawning a TTS service based on configuration.
 """
-
-from mycroft.tts.tts import TTSFactory, TTS, TTSValidator, PlaybackThread
+NOTE: this is dead code! do not use!
+This file is only present to ensure backwards compatibility
+in case someone is importing from here
+This is only meant for 3rd party code expecting ovos-core
+to be a drop in replacement for mycroft-core
+"""
+from mycroft.tts.tts import TTSFactory, TTS, TTSValidator, PlaybackThread
@@ -1,339 +1,9 @@
-# Copyright 2021 Mycroft AI Inc.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#    http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-"""TTS cache maintenance.
-
-There are two types of cache available to a TTS engine.  Both are comprised of
-audio and phoneme files.  TTS engines can use the cache to improve performance
-by not performing inference on sentences in the cache.
-
-The first type of cache is a persistent cache.  The cache is considered
-persistent because the files are stored in a location that is not cleared on
-reboot.  TTS inference on these sentences should only need to occur once.  The
-persistent cache contains commonly spoken sentences.
-
-The second cache type is a temporary cache stored in the /tmp directory,
-which is cleared when a device is rebooted.  Sentences are added to this cache
-on the fly every time a TTS engine returns audio for a sentence that is not
-already cached.
 """
-import base64
-import hashlib
-import json
-import re
-from pathlib import Path
-from typing import List, Set, Tuple
-from urllib import parse
-
-import requests
-
-from mycroft.util.file_utils import (
-    ensure_directory_exists, get_cache_directory, curate_cache
-)
-from mycroft.util.log import LOG
-
-
-def _get_mimic2_audio(sentence: str, url: str) -> Tuple[bytes, str]:
-    """Use the Mimic2 API to retrieve the audio for a sentence.
-
-    Args:
-        sentence: The sentence to be cached
-    """
-    LOG.debug("Retrieving Mimic2 audio for sentence \"{}\'".format(sentence))
-    mimic2_url = url + parse.quote(sentence) + '&visimes=True'
-    response = requests.get(mimic2_url)
-    response_data = response.json()
-    audio = base64.b64decode(response_data["audio_base64"])
-    phonemes = response_data["visimes"]
-
-    return audio, phonemes
-
-
-def hash_sentence(sentence: str):
-    """Convert the sentence into a hash value used for the file name
-
-    Args:
-        sentence: The sentence to be cached
-    """
-    encoded_sentence = sentence.encode("utf-8", "ignore")
-    sentence_hash = hashlib.md5(encoded_sentence).hexdigest()
-
-    return sentence_hash
-
-
-def hash_from_path(path: Path) -> str:
-    """Returns hash from a given path.
-
-    Simply removes extension and folder structure leaving the hash.
-
-    Args:
-        path: path to get hash from
-
-    Returns:
-        Hash reference for file.
-    """
-    return path.with_suffix('').name
-
-
-class AudioFile:
-    def __init__(self, cache_dir: Path, sentence_hash: str, file_type: str):
-        self.name = f"{sentence_hash}.{file_type}"
-        self.path = cache_dir.joinpath(self.name)
-
-    def save(self, audio: bytes):
-        """Write a TTS cache file containing the audio to be spoken.
-
-        Args:
-            audio: TTS inference of a sentence
-        """
-        try:
-            with open(self.path, "wb") as audio_file:
-                audio_file.write(audio)
-        except Exception:
-            LOG.exception("Failed to write {} to cache".format(self.name))
-
-    def exists(self):
-        return self.path.exists()
-
-
-class PhonemeFile:
-    def __init__(self, cache_dir: Path, sentence_hash: str):
-        self.name = f"{sentence_hash}.pho"
-        self.path = cache_dir.joinpath(self.name)
-
-    def load(self) -> List:
-        """Load phonemes from cache file."""
-        phonemes = None
-        if self.path.exists():
-            try:
-                with open(self.path) as phoneme_file:
-                    phonemes = phoneme_file.read().strip()
-            except Exception:
-                LOG.exception("Failed to read phoneme from cache")
-
-        return json.loads(phonemes)
-
-    def save(self, phonemes):
-        """Write a TTS cache file containing the phoneme to be displayed.
-
-        Args:
-            phonemes: instructions for how to make the mouth on a device move
-        """
-        try:
-            rec = json.dumps(phonemes)
-            with open(self.path, "w") as phoneme_file:
-                phoneme_file.write(rec)
-        except Exception:
-            LOG.error(f"Failed to write {self.name} to cache")
-
-    def exists(self):
-        return self.path.exists()
-
-
-class TextToSpeechCache:
-    """Class for all persistent and temporary caching operations."""
-    def __init__(self, tts_config, tts_name, audio_file_type):
-        self.config = tts_config
-        self.tts_name = tts_name
-        if "preloaded_cache" in self.config:
-            self.persistent_cache_dir = Path(self.config["preloaded_cache"])
-            ensure_directory_exists(
-                str(self.persistent_cache_dir), permissions=0o755
-            )
-        else:
-            self.persistent_cache_dir = None
-        self.temporary_cache_dir = Path(
-            get_cache_directory("tts/" + tts_name)
-        )
-        ensure_directory_exists(
-            str(self.temporary_cache_dir), permissions=0o755
-        )
-        self.audio_file_type = audio_file_type
-        self.resource_dir = Path(__file__).parent.parent.joinpath("res")
-        self.cached_sentences = {}
-        # curate cache if disk usage is above min %
-        self.min_free_percent = self.config.get("min_free_percent", 75)
-
-    def __contains__(self, sha):
-        """The cache contains a SHA if it knows of it and it exists on disk."""
-        if sha not in self.cached_sentences:
-            return False  # Doesn't know of it
-        else:
-            # Audio file must exist, phonemes are optional.
-            audio, phonemes = self.cached_sentences[sha]
-            return (audio.exists() and
-                    (phonemes is None or phonemes.exists()))
-
-    def load_persistent_cache(self):
-        """Load the contents of dialog files to the persistent cache directory.
-
-        Parse the dialog files in the resource directory into sentences.  Then
-        add the audio for each sentence to the cache directory.
-
-        NOTE: There may be files pre-loaded in the persistent cache directory
-        prior to run time, such as pre-recorded audio files.  This will add
-        files that do not already exist.
-
-        ANOTHER NOTE:  Mimic2 is the only TTS engine that supports
-        downloading missing files. This logic will need to change if another
-        TTS engine implements it.
-        """
-        if self.persistent_cache_dir is not None:
-            LOG.info("Adding dialog resources to persistent TTS cache...")
-            self._load_existing_audio_files()
-            self._load_existing_phoneme_files()
-            dialogs = self._collect_dialogs()
-            sentences = self._parse_dialogs(dialogs)
-            for sentence in sentences:
-                self._load_sentence(sentence)
-            LOG.info("Persistent TTS cache files added successfully.")
-
-    def _load_existing_audio_files(self):
-        """Find the TTS audio files already in the persistent cache."""
-        glob_pattern = "*." + self.audio_file_type
-        for file_path in self.persistent_cache_dir.glob(glob_pattern):
-            sentence_hash = file_path.name.split(".")[0]
-            audio_file = AudioFile(
-                self.persistent_cache_dir, sentence_hash, self.audio_file_type
-            )
-            self.cached_sentences[sentence_hash] = audio_file, None
-
-    def _load_existing_phoneme_files(self):
-        """Find the TTS phoneme files already in the persistent cache.
-
-        A phoneme file is no good without an audio file to pair it with.  If
-        no audio file matches, do not load the phoneme.
-        """
-        for file_path in self.persistent_cache_dir.glob("*.pho"):
-            sentence_hash = file_path.name.split(".")[0]
-            cached_sentence = self.cached_sentences.get(sentence_hash)
-            if cached_sentence is not None:
-                audio_file = cached_sentence[0]
-                phoneme_file = PhonemeFile(
-                    self.persistent_cache_dir, sentence_hash
-                )
-                self.cached_sentences[sentence_hash] = audio_file, phoneme_file
-
-    def _collect_dialogs(self) -> List:
-        """Build a set of unique sentences from the dialog files.
-
-        The sentences will be parsed from *.dialog files present in
-        mycroft/res/text/en-us.
-        """
-        dialogs = []
-        dialog_directory = Path(self.resource_dir, "text", "en-us")
-        for dialog_file_path in dialog_directory.glob("*.dialog"):
-            with open(dialog_file_path) as dialog_file:
-                for dialog in dialog_file.readlines():
-                    dialogs.append(dialog.strip())
-
-        return dialogs
-
-    @staticmethod
-    def _parse_dialogs(dialogs: List[str]) -> Set[str]:
-        """Split each dialog in the resources directory into sentences.
-
-        Do not consider sentences with special characters other than
-        punctuation
-            example : <<< LOADING <<<
-
-        Args:
-            dialogs: a list of the records in the dialog resource files
-        """
-        sentences = set()
-        dialog_split_regex = r"(?<=\.|\;|\?)\s"
-        special_characters_regex = re.compile(r"[@#$%^*()<>/|}{~:]")
-        for dialog in dialogs:
-            dialog_sentences = re.split(dialog_split_regex, dialog)
-            for sentence in dialog_sentences:
-                match = special_characters_regex.search(sentence)
-                if match is None:
-                    sentences.add(sentence)
-
-        return sentences
-
-    def _load_sentence(self, sentence: str):
-        """Build audio and phoneme files for each sentence to be cached.
-
-        Perform TTS inference on sentences parsed from dialog files.  Store
-        the results in the persistent cache directory.
-
-        ASSUMPTION: The only TTS that supports persistent cache right now is
-        Mimic2.  This method assumes a call to the Mimic2 API.  If other TTS
-        engines want to take advantage of the persistent cache, this logic
-        will need to be more dynamic.
-        """
-        # TODO support multiple engines
-        if self.tts_name != "Mimic2":
-            return
-
-        sentence_hash = hash_sentence(sentence)
-        if sentence_hash not in self.cached_sentences:
-            LOG.info("Adding \"{}\" to cache".format(sentence))
-            try:
-                mimic2_url = self.config["url"]
-                audio, phonemes = _get_mimic2_audio(sentence, mimic2_url)
-            except Exception:
-                log_msg = "Failed to get audio for sentence \"{}\""
-                LOG.exception(log_msg.format(sentence))
-            else:
-                self._add_to_persistent_cache(sentence_hash, audio, phonemes)
-
-    def _add_to_persistent_cache(
-            self, sentence_hash: str, audio: bytes, phonemes: str
-    ):
-        """Add a audio/phoneme file pair to the persistent cache."""
-        audio_file = AudioFile(
-            self.persistent_cache_dir, sentence_hash, self.audio_file_type
-        )
-        audio_file.save(audio)
-        if phonemes is None:
-            phoneme_file = None
-        else:
-            phoneme_file = PhonemeFile(
-                self.persistent_cache_dir, sentence_hash
-            )
-            phoneme_file.save(phonemes)
-        self.cached_sentences[sentence_hash] = audio_file, phoneme_file
-
-    def clear(self):
-        """Remove all files from the temporary cache."""
-        for cache_file_path in self.temporary_cache_dir.iterdir():
-            if cache_file_path.is_dir():
-                for sub_path in cache_file_path.iterdir():
-                    if sub_path.is_file():
-                        sub_path.unlink()
-            elif cache_file_path.is_file():
-                cache_file_path.unlink()
-
-    def curate(self):
-        """Remove cache data if disk space is running low."""
-        files_removed = curate_cache(self.temporary_cache_dir,
-                                     min_free_percent=self.min_free_percent)
-
-        hashes = set([hash_from_path(Path(path)) for path in files_removed])
-        for sentence_hash in hashes:
-            if sentence_hash in self.cached_sentences:
-                self.cached_sentences.pop(sentence_hash)
-
-    def define_audio_file(self, sentence_hash: str) -> AudioFile:
-        """Build an instance of an object representing an audio file."""
-        audio_file = AudioFile(
-            self.temporary_cache_dir, sentence_hash, self.audio_file_type
-        )
-        return audio_file
-
-    def define_phoneme_file(self, sentence_hash: str) -> PhonemeFile:
-        """Build an instance of an object representing an phoneme file."""
-        phoneme_file = PhonemeFile(self.temporary_cache_dir, sentence_hash)
-        return phoneme_file
+NOTE: this is dead code! do not use!
+This file is only present to ensure backwards compatibility
+in case someone is importing from here
+This is only meant for 3rd party code expecting ovos-core
+to be a drop in replacement for mycroft-core
+"""
+from ovos_plugin_manager.utils.tts_cache import hash_sentence, hash_from_path,\
+    AudioFile, PhonemeFile, TextToSpeechCache