Mushmou · rubynguyen1510 · Aug 1, 2023 · Jul 31, 2023 · Jul 31, 2023 · Aug 1, 2023
diff --git a/python/text-to-speech/main.py b/python/text-to-speech/main.py
@@ -101,9 +101,11 @@ def validate_request(self, req: requests) -> None:
 
     def get_token(self, subscription_key):
         """Grabs token with subscription key for Azure."""
-        fetch_token_url = 'https://westus.api.cognitive.microsoft.com/sts/v1.0/issuetoken'
+        fetch_token_url = (
+            "https://westus.api.cognitive.microsoft.com/sts/v1.0/issuetoken"
+        )
         headers = {
-            'Ocp-Apim-Subscription-Key': subscription_key
+            "Ocp-Apim-Subscription-Key": subscription_key
         }
         response = requests.post(fetch_token_url, headers=headers, timeout=10)
         access_token = str(response.text)
@@ -120,15 +122,27 @@ def speech(self, text: str, language: str) -> bytes:
         Returns:
             bytes: The synthezied speech in bytes.
         """
-        url = f"https://{self.region_key}.tts.speech.microsoft.com/cognitiveservices/v1"
+        url = (
+            f"https://{self.region_key}."
+            "tts.speech.microsoft.com/cognitiveservices/v1"
+        )
         headers_azure = {
-            'Content-type': 'application/ssml+xml',
-            # 'Ocp-Apim-Subscription-Key': self.api_key,
-            'Authorization': 'Bearer ' + self.get_token(self.api_key),
-            'X-Microsoft-OutputFormat': 'audio-16khz-32kbitrate-mono-mp3',
+            "Content-type": "application/ssml+xml",
+            "Authorization": "Bearer " + self.get_token(self.api_key),
+            "X-Microsoft-OutputFormat": "audio-16khz-32kbitrate-mono-mp3",
         }
-        data_azure = f"<speak version='1.0' xml:lang='{language}'><voice xml:lang='{language}' xml:gender='Male' name='en-US-ChristopherNeural'>{text}</voice></speak>"
-        response = requests.request("POST", url, headers=headers_azure, data=data_azure, timeout=10)
+        data_azure = (  # fragments join verbatim; keep trailing spaces
+            f"<speak version='1.0' xml:lang='{language}'><voice "
+            f"xml:lang='{language}' xml:gender='Male' "
+            f"name='en-US-ChristopherNeural'>{text}</voice></speak>"
+        )
+        response = requests.request(
+            "POST",
+            url,
+            headers=headers_azure,
+            data=data_azure,
+            timeout=10,
+        )
         response.raise_for_status()
         return response.content
 

diff --git a/python/text-to-speech/requirements.txt b/python/text-to-speech/requirements.txt
@@ -1,4 +1,5 @@
 boto3==1.28.9
 google-cloud-texttospeech==2.14.1
+# azure-cognitiveservices-speech==1.30.0
 parameterized==0.9.0
 requests==2.31.0
diff --git a/python/text-to-speech/test_main.py b/python/text-to-speech/test_main.py
@@ -207,6 +207,7 @@ def get_aws_instance(self, key, secret_key):
         (None, None),  # Missing Both
     ])
     def test_validate_request(self, key, secret_key):
+
         self.assertRaises(ValueError, self.get_aws_instance, key, secret_key)
 
     def test_speech_happy(self):