Spaces:

gnilets
/

tts

Running

App Files Files Community

gnilets committed on Sep 25, 2024

Commit

65919e0

verified ·

1 Parent(s): bf1867d

Update main.ts

Browse files

Files changed (1) hide show

main.ts +117 -166

main.ts CHANGED Viewed

@@ -1,127 +1,92 @@
-import { serve } from "https://deno.land/std/http/server.ts";
-import { EdgeSpeechTTS } from "https://esm.sh/@lobehub/tts@1";
-const VOICES_URL = "https://speech.platform.bing.com/consumer/speech/synthesize/readaloud/voices/list?trustedclienttoken=6A5AA1D4EAFF4E9FB37E23D68491D6F4";
-async function fetchVoiceList() {
-  const response = await fetch(VOICES_URL);
-  const voices = await response.json();
-  return voices.reduce((acc: Record<string, { model: string, name: string, friendlyName: string, locale: string }[]>, voice: any) => {
-    const { ShortName: model, ShortName: name, FriendlyName: friendlyName, Locale: locale } = voice;
-    if (!acc[locale]) acc[locale] = [];
-    acc[locale].push({ model, name, friendlyName, locale });
-    return acc;
-  }, {});
-}
 async function synthesizeSpeech(model: string, voice: string, text: string) {
-  let voiceName;
-  let rate = 0;
-  let pitch = 0;
-  if (!model.includes("Neural")) {
-    switch (model) {
-      case "ava":
-        voiceName = "en-US-AvaMultilingualNeural";
-        break;
-      case "andrew":
-        voiceName = "en-US-AndrewMultilingualNeural";
-        break;
-      case "emma":
-        voiceName = "en-US-EmmaMultilingualNeural";
-        break;
-      case "brian":
-        voiceName = "en-US-BrianMultilingualNeural";
-        break;
-      case "vivienne":
-        voiceName = "fr-FR-VivienneMultilingualNeural";
-        break;
-      case "remy":
-        voiceName = "fr-FR-RemyMultilingualNeural";
-        break;
-      case "seraphina":
-        voiceName = "de-DE-SeraphinaMultilingualNeural";
-        break;
-      case "florian":
-        voiceName = "de-DE-FlorianMultilingualNeural";
-        break;
-      case "dmitry":
-        voiceName = "ru-RU-DmitryNeural";
-        break;
-      case "svetlana":
-        voiceName = "ru-RU-SvetlanaNeural";
-        break;
-      default:
-        voiceName = "en-US-BrianMultilingualNeural";
-        break;
     }
-  } else {
-    voiceName = model;
-    const params = Object.fromEntries(
-      voice.split("|").map((p) => p.split(":") as [string, string])
-    );
-    rate = Number(params["rate"] || 0);
-    pitch = Number(params["pitch"] || 0);
-  }
-  const tts = new EdgeSpeechTTS();
-  const payload = {
-    input: text,
-    options: {
-      rate: rate,
-      pitch: pitch,
-      voice: voiceName
-     },
-  };
-  const response = await tts.create(payload);
-  const mp3Buffer = new Uint8Array(await response.arrayBuffer());
-  console.log(`Successfully synthesized speech, returning audio/mpeg response`);
-  return new Response(mp3Buffer, {
-    headers: { "Content-Type": "audio/mpeg" },
-  });
 }
 function validateContentType(req: Request, expected: string) {
-  const contentType = req.headers.get("Content-Type");
-  if (contentType !== expected) {
-    console.log(`Invalid Content-Type ${contentType}, expected ${expected}`);
-    return new Response("Bad Request", { status: 400 });
-  }
 }
-async function handleDebugRequest(req: Request) {
-  const url = new URL(req.url);
-  const voice = url.searchParams.get("voice") || "";
-  const model = url.searchParams.get("model") || "";
-  const text = url.searchParams.get("text") || "";
-  console.log(`Debug request with model=${model}, voice=${voice}, text=${text}`);
-  if (!voice || !model || !text) {
-    console.log("Missing required parameters");
-    return new Response("Bad Request", { status: 400 });
-  }
-  return synthesizeSpeech(model, voice, text);
 }
 async function handleSynthesisRequest(req: Request) {
-  if (req.method !== "POST") {
-    console.log(`Invalid method ${req.method}, expected POST`);
-    return new Response("Method Not Allowed", { status: 405 });
-  }
-  const invalidContentType = validateContentType(req, "application/json");
-  if (invalidContentType) return invalidContentType;
-  const { model, input, voice } = await req.json();
-  console.log(`Synthesis request with model=${model}, input=${input}, voice=${voice}`);
-  return synthesizeSpeech(model, voice, input);
 }
@@ -225,12 +190,12 @@ async function handleDemoRequest(req: Request) {
   }
   #audioPlayerContainer {
-    text-align: center; /* Центрируем содержимое контейнера */
   }
   audio {
     width: 100%;
-    max-width: 600px; /* Ограничиваем максимальную ширину плеера */
     margin: 10px 0;
   }
@@ -283,18 +248,15 @@ async function handleDemoRequest(req: Request) {
         const audioUrl = URL.createObjectURL(blob);
         const audioPlayerContainer = document.getElementById('audioPlayerContainer');
-        // Удаляем старый аудиоплеер, если он существует
         if (audio) {
             audio.pause();
             audioPlayerContainer.innerHTML = '';
         }
-        // Создаем новый аудиоплеер
         audio = new Audio(audioUrl);
         audio.controls = true;
         audioPlayerContainer.appendChild(audio);
-        // Создаем ссылку для скачивания
         const downloadLink = document.createElement('a');
         downloadLink.href = audioUrl;
         downloadLink.download = 'synthesized_voice.mp3';
@@ -302,10 +264,7 @@ async function handleDemoRequest(req: Request) {
         downloadLink.style.display = 'block';
         downloadLink.style.marginTop = '10px';
-        // Добавляем ссылку для скачивания в контейнер
         audioPlayerContainer.appendChild(downloadLink);
-        // Воспроизводим аудио
         audio.play();
     });
@@ -324,7 +283,7 @@ async function handleDemoRequest(req: Request) {
             voiceSelect.appendChild(option);
           });
         } catch (error) {
-          console.error('Ошибка при получении списка моделей:', error);
         }
       }
@@ -334,61 +293,53 @@ async function handleDemoRequest(req: Request) {
  </body></html>`;
     return new Response(html, {
-      headers: { "Content-Type": "text/html" },
     });
 }
 async function handleVoiceList() {
-  let voices = [
-    {model: 'ava', gender: 'female'},
-    {model: 'andrew', gender: 'male'},
-    {model: 'emma', gender: 'female'},
-    {model: 'brian', gender: 'male'},
-    {model: 'vivienne', gender: 'female'},
-    {model: 'remy', gender: 'male'},
-    {model: 'seraphina', gender: 'female'},
-    {model: 'florian', gender: 'male'},
-    {model: 'dmitry', gender: 'male'},
-    {model: 'svetlana', gender: 'female'}
-  ];
-  const sortedVoiceList = voices.sort((a, b) => {
-    if (a.gender === 'male' && b.gender === 'female') return -1;
-    if (a.gender === 'female' && b.gender === 'male') return 1;
-    return 0;
-  });
-  return new Response(JSON.stringify(sortedVoiceList), {
-    headers: { "Content-Type": "application/json" },
-  });
 }
 serve(async (req) => {
-  try {
-    const url = new URL(req.url);
-    if (url.pathname === "/") {
-      return handleDemoRequest(req);
-    }
-    if (url.pathname === "/v1/audio/models") {
-      return handleVoiceList();
-    }
-    if (url.pathname === "/tts") {
-      return handleDebugRequest(req);
-    }
-    if (url.pathname !== "/v1/audio/speech") {
-      console.log(`Unhandled path ${url.pathname}`);
-      return new Response("Not Found", { status: 404 });
-    }
-    return handleSynthesisRequest(req);
-  } catch (err) {
-    console.error(`Error processing request: ${err.message}`);
-    return new Response(`Internal Server Error\n${err.message}`, {
-      status: 500,
-    });
-  }
 });

+import {serve} from "https://deno.land/std/http/server.ts";
+import {EdgeSpeechTTS} from "https://esm.sh/@lobehub/tts@1";
 /** Short model aliases accepted by synthesizeSpeech, mapped to the full voice names they select. */
 const VOICE_ALIASES = new Map<string, string>([
     ["ava", "en-US-AvaMultilingualNeural"],
     ["andrew", "en-US-AndrewMultilingualNeural"],
     ["emma", "en-US-EmmaMultilingualNeural"],
     ["brian", "en-US-BrianMultilingualNeural"],
     ["vivienne", "fr-FR-VivienneMultilingualNeural"],
     ["remy", "fr-FR-RemyMultilingualNeural"],
     ["seraphina", "de-DE-SeraphinaMultilingualNeural"],
     ["florian", "de-DE-FlorianMultilingualNeural"],
     ["dmitry", "ru-RU-DmitryNeural"],
     ["svetlana", "ru-RU-SvetlanaNeural"],
 ]);

 /** Voice used when a short model alias is not recognised. */
 const FALLBACK_VOICE_NAME = "en-US-BrianMultilingualNeural";

 /**
  * Extracts the `rate` and `pitch` settings from a "key:value|key:value" string.
  *
  * Anything that is not a string, and any setting that is missing, empty or
  * not a finite number, yields 0 for that setting instead of throwing or
  * producing NaN.
  */
 function parseVoiceSettings(voice: unknown): { rate: number; pitch: number } {
     const entries = new Map<string, string | undefined>();
     if (typeof voice === "string") {
         for (const entry of voice.split("|")) {
             const [key, value] = entry.split(":");
             // A later duplicate key overrides an earlier one.
             entries.set(key, value);
         }
     }
     const toNumber = (raw: string | undefined): number => {
         const parsed = Number(raw || 0);
         return Number.isFinite(parsed) ? parsed : 0;
     };
     return {rate: toNumber(entries.get("rate")), pitch: toNumber(entries.get("pitch"))};
 }

 /**
  * Synthesizes `text` with EdgeSpeechTTS and returns the audio as an
  * `audio/mpeg` response.
  *
  * @param model Either a full voice name containing "Neural", which is used
  *   as-is, or a short alias such as "ava". Unknown aliases fall back to
  *   FALLBACK_VOICE_NAME.
  * @param voice Settings string of the form "rate:<n>|pitch:<n>". It is only
  *   consulted when `model` is a full voice name; aliases always use rate 0
  *   and pitch 0.
  * @param text The text to synthesize.
  * @returns A Response whose body is the synthesized audio bytes.
  */
 async function synthesizeSpeech(model: string, voice: string, text: string) {
     let voiceName: string;
     let rate = 0;
     let pitch = 0;
     if (model.includes("Neural")) {
         voiceName = model;
         // `voice` originates from request JSON and may be absent; the parser tolerates that.
         ({rate, pitch} = parseVoiceSettings(voice));
     } else {
         voiceName = VOICE_ALIASES.get(model) ?? FALLBACK_VOICE_NAME;
     }
     const tts = new EdgeSpeechTTS();
     const response = await tts.create({
         input: text,
         options: {rate, pitch, voice: voiceName},
     });
     const mp3Buffer = new Uint8Array(await response.arrayBuffer());
     return new Response(mp3Buffer, {
         headers: {"Content-Type": "audio/mpeg"},
     });
 }
 /**
  * Checks that the request's Content-Type header names the expected media type.
  *
  * Only the media type itself is compared: parameters after ";" (for example
  * "; charset=utf-8") are ignored and the comparison is case-insensitive, so
  * "application/json; charset=utf-8" matches "application/json".
  *
  * @param req The incoming request.
  * @param expected The required media type, e.g. "application/json".
  * @returns A 400 "Bad Request" response when the header is missing or names a
  *   different media type; `undefined` when the header is acceptable.
  */
 function validateContentType(req: Request, expected: string): Response | undefined {
     const contentType = req.headers.get("Content-Type");
     const mediaType = (contentType ?? "").split(";")[0].trim().toLowerCase();
     if (mediaType !== expected.trim().toLowerCase()) {
         console.log(`Invalid Content-Type ${contentType}, expected ${expected}`);
         return new Response("Bad Request", {status: 400});
     }
     return undefined;
 }
+async function handleDebugRequest() {
+    const voice = "rate:0.0|pitch:0.0";
+    const model = "en-US-BrianMultilingualNeural";
+    const text = "Приветик! Надеюсь ты меня хорошо слышишь? Алё?!";
+    console.log(`model=${model}, voice=${voice}, text=${text}`);
+    return synthesizeSpeech(model, voice, text);
 }
 /**
  * Handles a speech synthesis request.
  *
  * Expects a POST with a JSON body of the form `{model, input, voice}`.
  * `model` and `input` must be strings; `voice` is optional and is treated as
  * an empty settings string when it is absent or not a string.
  *
  * @param req The incoming request.
  * @returns 405 for non-POST methods, 400 for a wrong Content-Type, an
  *   unparsable body or missing/non-string `model`/`input`; otherwise the
  *   response produced by synthesizeSpeech.
  */
 async function handleSynthesisRequest(req: Request) {
     if (req.method !== "POST") {
         return new Response("Method Not Allowed", {status: 405});
     }
     const invalidContentType = validateContentType(req, "application/json");
     if (invalidContentType) return invalidContentType;

     let body: unknown;
     try {
         body = await req.json();
     } catch {
         // Malformed JSON is a client error, not a server failure.
         console.log("Request body is not valid JSON");
         return new Response("Bad Request", {status: 400});
     }
     if (typeof body !== "object" || body === null) {
         console.log("Request body is not a JSON object");
         return new Response("Bad Request", {status: 400});
     }

     const {model, input, voice} = body as Record<string, unknown>;
     if (typeof model !== "string" || typeof input !== "string") {
         console.log("Missing or non-string 'model' / 'input' in request body");
         return new Response("Bad Request", {status: 400});
     }
     return synthesizeSpeech(model, typeof voice === "string" ? voice : "", input);
 }
   }
   #audioPlayerContainer {
+    text-align: center;
   }
   audio {
     width: 100%;
+    max-width: 600px;
     margin: 10px 0;
   }
         const audioUrl = URL.createObjectURL(blob);
         const audioPlayerContainer = document.getElementById('audioPlayerContainer');
         if (audio) {
             audio.pause();
             audioPlayerContainer.innerHTML = '';
         }
         audio = new Audio(audioUrl);
         audio.controls = true;
         audioPlayerContainer.appendChild(audio);
         const downloadLink = document.createElement('a');
         downloadLink.href = audioUrl;
         downloadLink.download = 'synthesized_voice.mp3';
         downloadLink.style.display = 'block';
         downloadLink.style.marginTop = '10px';
         audioPlayerContainer.appendChild(downloadLink);
         audio.play();
     });
             voiceSelect.appendChild(option);
           });
         } catch (error) {
+          console.error('ошибка при получении списка моделей:', error);
         }
       }
  </body></html>`;
     return new Response(html, {
+        headers: {"Content-Type": "text/html"},
     });
 }
 /** Short model aliases advertised by the voice-list endpoint, with the gender used for ordering. */
 const ADVERTISED_VOICES: ReadonlyArray<{ model: string; gender: "male" | "female" }> = [
     {model: 'ava', gender: 'female'},
     {model: 'andrew', gender: 'male'},
     {model: 'emma', gender: 'female'},
     {model: 'brian', gender: 'male'},
     {model: 'vivienne', gender: 'female'},
     {model: 'remy', gender: 'male'},
     {model: 'seraphina', gender: 'female'},
     {model: 'florian', gender: 'male'},
     {model: 'dmitry', gender: 'male'},
     {model: 'svetlana', gender: 'female'},
 ];

 /**
  * Returns the advertised voices as a JSON array of `{model, gender}` objects,
  * male voices first and female voices after them. Within each gender the
  * declaration order is kept (the sort is stable).
  *
  * @returns A Response with Content-Type "application/json".
  */
 async function handleVoiceList() {
     const genderRank = (gender: "male" | "female"): number => (gender === 'male' ? 0 : 1);
     // Sort a copy so the shared constant is never mutated.
     const sortedVoiceList = [...ADVERTISED_VOICES].sort(
         (a, b) => genderRank(a.gender) - genderRank(b.gender),
     );
     return new Response(JSON.stringify(sortedVoiceList), {
         headers: {"Content-Type": "application/json"},
     });
 }
 // Entry point: routes each request by path.
 //   "/"                 -> demo page
 //   "/v1/audio/models"  -> voice list
 //   "/tts"              -> debug synthesis
 //   "/v1/audio/speech"  -> synthesis API
 // Any other path gets a 404.
 serve(async (req) => {
     try {
         const url = new URL(req.url);
         // Every handler is awaited here: returning the bare promise would let a
         // rejection escape this try block and skip the 500 response below.
         if (url.pathname === "/") {
             return await handleDemoRequest(req);
         }
         if (url.pathname === "/v1/audio/models") {
             return await handleVoiceList();
         }
         if (url.pathname === "/tts") {
             return await handleDebugRequest();
         }
         if (url.pathname !== "/v1/audio/speech") {
             console.log(`Unhandled path ${url.pathname}`);
             return new Response("Not Found", {status: 404});
         }
         return await handleSynthesisRequest(req);
     } catch (err) {
         // Thrown values are not guaranteed to be Error instances.
         const message = err instanceof Error ? err.message : String(err);
         console.error(`Error processing request: ${message}`);
         return new Response(`Internal Server Error\n${message}`, {
             status: 500,
         });
     }
 });