Merge 1261b8e into 47af401

seanbudd · web-flow · commit 700ad28992cd · 2022-06-09T13:00:46.000+10:00
diff --git a/source/speech/manager.py b/source/speech/manager.py
@@ -331,15 +331,6 @@ def _processSpeechSequence(self, inSeq: SpeechSequence):
 
 		outSeq = []
 		for command in inSeq:
-			if isinstance(command, LangChangeCommand) and currentSynth.name == 'oneCore':
-				langCode = command.lang.split('_')[0]
-				langSupported = False
-				currentSynthLanguages = currentSynth.availableLanguages
-				for lang in currentSynthLanguages:
-					if lang and normalizeLanguage(lang).split('_')[0] == langCode:
-						langSupported = True
-				if not langSupported:
-					log.warning(f"Language {command.lang} not supported by {currentSynth.name} ({currentSynthLanguages})")
 			if isinstance(command, BaseCallbackCommand):
 				# When the synth reaches this point, we want to call the callback.
 				speechIndex = next(self._indexCounter)
diff --git a/source/speechXml.py b/source/speechXml.py
@@ -1,5 +1,5 @@
 # A part of NonVisual Desktop Access (NVDA)
-# Copyright (C) 2016-2021 NV Access Limited
+# Copyright (C) 2016-2022 NV Access Limited
 # This file is covered by the GNU General Public License.
 # See the file COPYING for more details.
 
@@ -14,7 +14,7 @@
 import re
 import speech
 import textUtils
-from speech.commands import SpeechCommand
+from speech.commands import LangChangeCommand, SpeechCommand
 from logHandler import log
 
 XML_ESCAPES = {
@@ -49,7 +49,8 @@ def _buildInvalidXmlRegexp():
 RE_INVALID_XML_CHARS = _buildInvalidXmlRegexp()
 REPLACEMENT_CHAR = textUtils.REPLACEMENT_CHAR
 
-def toXmlLang(nvdaLang):
+
+def toXmlLang(nvdaLang: str) -> str:
 	"""Convert an NVDA language to an XML language.
 	"""
 	return nvdaLang.replace("_", "-")
@@ -153,7 +154,7 @@ def _outputTags(self):
 			self._openTags.append(tag)
 		self._tagsChanged = False
 
-	def generateXml(self, commands):
+	def generateXml(self, commands) -> str:
 		"""Generate XML from a sequence of balancer commands and text.
 		"""
 		for command in commands:
@@ -235,7 +236,7 @@ class SsmlConverter(SpeechXmlConverter):
 	"""Converts an NVDA speech sequence to SSML.
 	"""
 
-	def __init__(self, defaultLanguage):
+	def __init__(self, defaultLanguage: str):
 		self.defaultLanguage = toXmlLang(defaultLanguage)
 
 	def generateBalancerCommands(self, speechSequence):
@@ -254,7 +255,7 @@ def convertCharacterModeCommand(self, command):
 		else:
 			return StopEnclosingTextCommand()
 
-	def convertLangChangeCommand(self, command):
+	def convertLangChangeCommand(self, command: LangChangeCommand) -> SetAttrCommand:
 		lang = command.lang or self.defaultLanguage
 		lang = toXmlLang(lang)
 		return SetAttrCommand("voice", "xml:lang", lang)
diff --git a/source/synthDrivers/oneCore.py b/source/synthDrivers/oneCore.py
@@ -7,7 +7,7 @@
 """
 
 import os
-import sys
+from typing import Any, Callable, Generator, List, Optional, Set, Tuple, Union
 from collections import OrderedDict
 import ctypes
 import winreg
@@ -25,6 +25,7 @@
 import config
 import nvwave
 import queueHandler
+from speech.types import SpeechSequence
 import speech
 import speechXml
 import languageHandler
@@ -47,6 +48,14 @@
 ocSpeech_Callback = ctypes.CFUNCTYPE(None, ctypes.c_void_p, ctypes.c_int, ctypes.c_wchar_p)
 
 class _OcSsmlConverter(speechXml.SsmlConverter):
+	def __init__(
+			self,
+			defaultLanguage: str,
+			availableLanguages: Set[str],
+	):
+		self.lowerCaseAvailableLanguages = {language.lower() for language in availableLanguages}
+		self.availableLanguagesWithoutLocale = {language.split("_")[0] for language in self.lowerCaseAvailableLanguages}
+		super().__init__(defaultLanguage)
 
 	def _convertProsody(self, command, attr, default, base=None):
 		if base is None:
@@ -74,23 +83,40 @@ def convertCharacterModeCommand(self, command):
 		# Therefore, we don't use it.
 		return None
 
-	def convertLangChangeCommand(self, command):
+	def convertLangChangeCommand(self, command: LangChangeCommand) -> Optional[speechXml.SetAttrCommand]:
 		lcid = languageHandler.localeNameToWindowsLCID(command.lang)
 		if lcid is languageHandler.LCID_NONE:
 			log.debugWarning(f"Invalid language: {command.lang}")
 			return None
+
+		normalizedLanguage = command.lang.lower().replace("-", "_")
+		normalizedLanguageWithoutLocale = normalizedLanguage.split("_")[0]
+		if (
+			normalizedLanguage not in self.lowerCaseAvailableLanguages
+			and normalizedLanguageWithoutLocale not in self.availableLanguagesWithoutLocale
+		):
+			log.warning(f"Language {command.lang} not supported ({self.lowerCaseAvailableLanguages})")
+			return None
+
 		return super().convertLangChangeCommand(command)
 
 class _OcPreAPI5SsmlConverter(_OcSsmlConverter):
 
-	def __init__(self, defaultLanguage, rate, pitch, volume):
-		super(_OcPreAPI5SsmlConverter, self).__init__(defaultLanguage)
+	def __init__(
+			self,
+			defaultLanguage: str,
+			availableLanguages: Set[str],
+			rate: float,
+			pitch: float,
+			volume: float,
+	):
+		super().__init__(defaultLanguage, availableLanguages)
 		self._rate = rate
 		self._pitch = pitch
 		self._volume = volume
 
-	def generateBalancerCommands(self, speechSequence):
-		commands = super(_OcPreAPI5SsmlConverter, self).generateBalancerCommands(speechSequence)
+	def generateBalancerCommands(self, speechSequence: SpeechSequence) -> Generator[Any, None, None]:
+		commands = super().generateBalancerCommands(speechSequence)
 		# The EncloseAllCommand from SSML must be first.
 		yield next(commands)
 		# OneCore didn't provide a way to set base prosody values before API version 5.
@@ -135,6 +161,9 @@ class OneCoreSynthDriver(SynthDriver):
 	}
 	supportedNotifications = {synthIndexReached, synthDoneSpeaking}
 
+	_ocSpeechToken: Optional[ctypes.POINTER]
+	_queuedSpeech: List[Union[str, Tuple[Callable[[ctypes.POINTER, float], None], float]]]
+
 	@classmethod
 	def check(cls):
 		# Only present this as an available synth if this is Windows 10.
@@ -235,11 +264,17 @@ def cancel(self):
 		if self._player:
 			self._player.stop()
 
-	def speak(self, speechSequence):
+	def speak(self, speechSequence: SpeechSequence) -> None:
 		if self.supportsProsodyOptions:
-			conv = _OcSsmlConverter(self.language)
+			conv = _OcSsmlConverter(self.language, self.availableLanguages)
 		else:
-			conv = _OcPreAPI5SsmlConverter(self.language, self._rate, self._pitch, self._volume)
+			conv = _OcPreAPI5SsmlConverter(
+				self.language,
+				self.availableLanguages,
+				self._rate,
+				self._pitch,
+				self._volume
+			)
 		text = conv.convertToXml(speechSequence)
 		# #7495: Calling WaveOutOpen blocks for ~100 ms if called from the callback
 		# when the SSML includes marks.
@@ -249,7 +284,7 @@ def speak(self, speechSequence):
 			self._player.open()
 		self._queueSpeech(text)
 
-	def _queueSpeech(self, item):
+	def _queueSpeech(self, item: str) -> None:
 		self._queuedSpeech.append(item)
 		# We only process the queue here if it isn't already being processed.
 		if not self._isProcessing:
@@ -433,7 +468,8 @@ def _getVoiceInfoFromOnecoreVoiceString(self, voiceStr):
 	def _getAvailableVoices(self):
 		voices = OrderedDict()
 		# Fetch the full list of voices that Onecore speech knows about.
-		# Note that it may give back voices that are uninstalled or broken. 
+		# Note that it may give back voices that are uninstalled or broken.
+		# Refer to _isVoiceValid for information on uninstalled or broken voices.
 		voicesStr = self._dll.ocSpeech_getVoices(self._ocSpeechToken).split('|')
 		for index,voiceStr in enumerate(voicesStr):
 			voiceInfo=self._getVoiceInfoFromOnecoreVoiceString(voiceStr)
@@ -444,14 +480,26 @@ def _getAvailableVoices(self):
 			voices[voiceInfo.id] =  voiceInfo
 		return voices
 
-	def _isVoiceValid(self,ID):
-		"""
+	def _isVoiceValid(self, ID: str) -> bool:
+		r"""
 		Checks that the given voice actually exists and is valid.
 		It checks the Registry, and also ensures that its data files actually exist on this machine.
 		@param ID: the ID of the requested voice.
-		@type ID: string
-		@returns: True if the voice is valid, false otherwise.
-		@rtype: boolean
+		@returns: True if the voice is valid, False otherwise.
+
+		OneCore keeps a separate registry cache of its own registry data for each AT application.
+		NVDA's OneCore cache is: `HKEY_CURRENT_USER\Software\Microsoft\Speech_OneCore\Isolated\Ny37kw9G-o42UiJ1z6Qc_sszEKkCNywTlrTOG0QKVB4`.
+		The caches contain a subtree which is meant to mirror the path `HKEY_LOCAL_MACHINE\SOFTWARE\Microsoft\Speech_OneCore\*`.
+
+		For example
+		`HKEY_CURRENT_USER\Software\Microsoft\Speech_OneCore\Isolated\Ny37kw9G-o42UiJ1z6Qc_sszEKkCNywTlrTOG0QKVB4\
+		HKEY_LOCAL_MACHINE\SOFTWARE\Microsoft\Speech_OneCore\Voices\Tokens\MSTTS_V110_enUS_MarkM`
+		refers to `HKEY_LOCAL_MACHINE\SOFTWARE\Microsoft\Speech_OneCore\Voices\Tokens\MSTTS_V110_enUS_MarkM`.
+
+		Languages which have been used by an installed copy of NVDA but have since been uninstalled from the system are kept in the cache.
+		OneCore will still attempt to use these languages, so we must check if they are valid first.
+
+		Refer to https://github.com/nvaccess/nvda/issues/13732#issuecomment-1149386711 for more information.
 		"""
 		IDParts = ID.split('\\')
 		rootKey = getattr(winreg, IDParts[0])