MMAPI-2

Running

App Files Files Community

DeFactOfficial committed on Oct 26, 2024

Commit

996c544

verified ·

1 Parent(s): 477624d

Update api.js

Browse files

Files changed (1) hide show

api.js +4 -90

api.js CHANGED Viewed

@@ -202,97 +202,11 @@ app.post('api/generate/speech', async (req, res) =>{
 })
-// This is normal TTS: specify voice, text, model. Voices are from openai, use those names or the aliases in lookup table
-app.get('api/generate/utterance', async (req, res) => {
-  const {voice, text, model} = req.query
-  console.log("Utterance Params", {voice, text, model})
-  //const outputFilename= await generateAudio(voice, text, model || "tts-1")
-  // We want the browser to cache this response, because there's no reason to TTS the same text-voice-model combination more than once
-  //await res.sendFile(path.resolve(outputFilename), { headers: { 'Content-Type': 'audio/mpeg', 'Cache-Control':'Max-Age=8640000' } });
 })
-app.post('api/generate/utterance', async (req, res) =>{
-  const {voice, text, model} = req.body
-  const outputFilename= await generateAudio(voice, text, model || "tts-1")
-  // We want the browser to cache this response, because there's no reason to TTS the same text-voice-model combination more than once
-  res.sendFile(path.resolve(outputFilename), { headers: { 'Content-Type': 'audio/mpeg', 'Cache-Control':'Max-Age=8640000' } });
-})
-// This returns a stream of SSE (text/event-stream) similar to a streaming response from an LLM
-// See example in public/client for how to consume the stream
-app.post('/api/generate/speech/stream', async (req, res) => {
-  try {
-    const apiKey = req.query.api_key || 'their_api_key';
-    if (apiKey !== 'their_api_key') {
-      // Replace "their_api_key" with your actual method of managing API keys
-      res.status(401).send('Unauthorized');
-      return;
-    }
-    const script = req.body.payload;
-    if (!script) {
-      res.status(400).send('Bad Request: Missing payload');
-      return;
-    }
-    // Set headers for SSE
-    res.setHeader('Content-Type', 'text/event-stream');
-    res.setHeader('Cache-Control', 'no-cache');
-    res.setHeader('Connection', 'keep-alive');
-    const hash = crypto.createHash('sha1');
-    hash.update(script);
-    const scriptHash = hash.digest('hex');
-    if (audioCache[scriptHash]) {
-      // If audio is cached, send the final SSE with the combined audio URL
-      const filePath = audioCache[scriptHash];
-      console.log(filePath)
-      res.write(`event: audio_complete\ndata: ${req.protocol}://${req.get('host')}/${filePath}\n\n`);
-      res.end();
-      return;
-    }
-    const parsedSegments = parseScript(script);
-    const audioSegments = [];
-    for (const segment of parsedSegments) {
-      const audioPath = await generateAudio(segment.speaker_name, segment.content);
-      audioSegments.push(audioPath);
-      // Send SSE with the URL of the generated audio segment
-      res.write(`event: audio_segment\ndata: ${req.protocol}://${req.get('host')}/${audioPath}\n\n`);
-    }
-    if (audioSegments.length === 0) {
-      res.write(`event: error\ndata: No audio generated\n\n`);
-      res.end();
-      return;
-    }
-    // Concatenate audio files into one using FFmpeg
-    const combinedAudioPath = path.join(MEDIA_FOLDER, `combined_${uuidv4()}.mp3`);
-    await concatenateAudioFiles(audioSegments, combinedAudioPath);
-    audioCache[scriptHash] = combinedAudioPath;
-    console.log(combinedAudioPath)
-    // Send SSE with the URL of the combined audio
-    res.write(`event: audio_complete\ndata: ${req.protocol}://${req.get('host')}/${combinedAudioPath}\n\n`);
-    res.end();
-  } catch (error) {
-    console.error('Error generating speech:', error);
-    res.write(`event: error\ndata: Internal Server Error\n\n`);
-    res.end();
-  }
-});
 //Image generation parameters
 //response_format: image | url

 })
+app.get('/api/hello', async(req, res) => {
+  await res.status(200).send({"hello": "world"}, {headers: {"Content-Type":"application/json"}})
+  res.end()
 })
+// This is normal TTS: specify voice, text, model. Voices are from openai, use those names or the aliases in lookup table
 //Image generation parameters
 //response_format: image | url