sample WAV audio output for each voice included with OpenedAI Speech

3 months ago · a52bc15da5
12 changed files with 8 additions and 2 deletions
--- a/acosta.wav
+++ b/acosta.wav
--- a/assets/speech/news-alloy-alt.wav
+++ b/assets/speech/news-alloy-alt.wav
--- a/assets/speech/news-alloy.wav
+++ b/assets/speech/news-alloy.wav
--- a/assets/speech/news-fable.wav
+++ b/assets/speech/news-fable.wav
--- a/assets/speech/news-nova.wav
+++ b/assets/speech/news-nova.wav
--- a/assets/speech/news-onyx.wav
+++ b/assets/speech/news-onyx.wav
--- a/assets/speech/news-shimmer.wav
+++ b/assets/speech/news-shimmer.wav
--- a/assets/speech/speech-script
+++ b/assets/speech/speech-script
@@ -0,0 +1 @@
+Hello. My name is Shimmer. I am one of the voices that ships with Opened AI Speech, and I'm happy to read the news for you today.
--- a/package.json
+++ b/package.json
@@ -9,6 +9,7 @@
    "web-dev": "nodemon ./src/newsroom-web.ts",
    "start-worker": "node --import ./register.js --no-warnings ./src/workers/newsroom.ts",
    "worker-dev": "nodemon ./src/workers/newsroom.ts",
+    "speechgen": "node --import ./register.js --no-warnings ./src/speechgen.ts",
    "test": "echo \"Error: no test specified\" && exit 1"
  },
  "keywords": [
--- a/robc.wav
+++ b/robc.wav
--- a/src/app/services/openai.ts
+++ b/src/app/services/openai.ts
@@ -40,6 +40,7 @@ export class OpenAiService extends DtpService {
    });
    this.homelabClient = new OpenAI({
      baseURL: env.apis.openai.homelab.baseURL,
+      apiKey: "unused",
    });
  }

@@ -138,12 +139,14 @@ export class OpenAiService extends DtpService {

  async generateSpeech (input: string, model: string, voice: SpeechVoice) : Promise<IGeneratedFile> {
    const audioId = new Types.ObjectId();
-    const audioFile = path.join(env.root, audioId.toString());
+    const audioFile = path.join(env.root, `${audioId.toString()}.wav`);
    
    const response = await this.homelabClient.audio.speech.create({
      input,
      model,
-      voice
+      voice,
+      response_format: "wav",
+      speed: 1.0,
    });
    if (!response.ok) {
      throw new WebError(response.status, `failed to generate speech audio: ${response.statusText}`);
--- a/src/speechgen.ts
+++ b/src/speechgen.ts
@@ -39,6 +39,7 @@ class SpeechGenerator extends DtpProcess {
  try {
    console.log("Speech Generator: A command line tool to generate audio");
    const generator = new SpeechGenerator();
+    await generator.start();

    const model = process.argv[2];
    assert(model, "Must specify model (tts-1, tts-1-hd)");
			`@ -0,0 +1 @@`
			`Hello. My name is Shimmer. I am one of the voices that ships with Opened AI Speech, and I'm happy to read the news for you today.`