Files
VoiceRSSSummary/services/tts.ts
2025-06-07 14:44:58 +09:00

145 lines
4.1 KiB
TypeScript

import fs from "fs";
import path from "path";
import ffmpegPath from "ffmpeg-static";
import { config } from "./config.js";
/** Voice selection used when building VOICEVOX request URLs. */
type VoiceStyle = {
  /** Numeric VOICEVOX style identifier. */
  styleId: number;
};

// Default voice settings, read from `config.voicevox.styleId`
// (per the original note, this value originates from environment variables).
const defaultVoiceStyle: VoiceStyle = { styleId: config.voicevox.styleId };
/**
 * Generate TTS without adding to the retry queue on failure.
 * Used for retry queue processing to avoid infinite loops.
 *
 * Steps:
 * 1. POST `/audio_query` on the VOICEVOX host with the script text.
 * 2. POST the returned query JSON to `/synthesis` to obtain the audio bytes.
 * 3. Write the audio as `<itemId>.wav` under `config.paths.podcastAudioDir`,
 *    convert it to `<itemId>.mp3` with ffmpeg, then delete the WAV file.
 *
 * @param itemId - Identifier used as the base name of the output files.
 * @param scriptText - Text to synthesize.
 * @param retryCount - Zero-based attempt counter; only used in log output here.
 * @returns The base name of the generated MP3 file (`<itemId>.mp3`).
 * @throws Error when `itemId` or `scriptText` is empty or whitespace-only,
 *   when either VOICEVOX request returns a non-OK status, or when ffmpeg
 *   exits with a non-zero code. Fetch and file-system errors propagate as-is.
 */
export async function generateTTSWithoutQueue(
  itemId: string,
  scriptText: string,
  retryCount: number = 0,
): Promise<string> {
  if (!itemId || itemId.trim() === "") {
    throw new Error("Item ID is required for TTS generation");
  }
  if (!scriptText || scriptText.trim() === "") {
    throw new Error("Script text is required for TTS generation");
  }

  console.log(`TTS生成開始: ${itemId} (試行回数: ${retryCount + 1})`);

  // 10 minutes. Applied to both VOICEVOX requests so that a stalled engine
  // cannot hang this call forever at the audio_query step.
  const requestTimeoutMs = 600000;

  const encodedText = encodeURIComponent(scriptText);
  const queryUrl = `${config.voicevox.host}/audio_query?text=${encodedText}&speaker=${defaultVoiceStyle.styleId}`;
  const synthesisUrl = `${config.voicevox.host}/synthesis?speaker=${defaultVoiceStyle.styleId}`;

  const queryResponse = await fetch(queryUrl, {
    method: "POST",
    headers: {
      "Content-Type": "application/json",
      Accept: "application/json",
    },
    signal: AbortSignal.timeout(requestTimeoutMs),
  });
  if (!queryResponse.ok) {
    const errorText = await queryResponse.text();
    throw new Error(
      `VOICEVOX audio query failed (${queryResponse.status}): ${errorText}`,
    );
  }
  const audioQuery = await queryResponse.json();

  console.log(`音声合成開始: ${itemId}`);
  const audioResponse = await fetch(synthesisUrl, {
    method: "POST",
    headers: {
      "Content-Type": "application/json",
    },
    body: JSON.stringify(audioQuery),
    signal: AbortSignal.timeout(requestTimeoutMs),
  });
  if (!audioResponse.ok) {
    const errorText = await audioResponse.text();
    console.error(`音声合成失敗: ${itemId}`);
    throw new Error(
      `VOICEVOX synthesis failed (${audioResponse.status}): ${errorText}`,
    );
  }
  const audioBuffer = Buffer.from(await audioResponse.arrayBuffer());

  // Prepare the output directory. With `recursive: true` this is a no-op when
  // the directory already exists, so no separate existence check is needed.
  const outputDir = config.paths.podcastAudioDir;
  fs.mkdirSync(outputDir, { recursive: true });

  const wavFilePath = path.resolve(outputDir, `${itemId}.wav`);
  const mp3FilePath = path.resolve(outputDir, `${itemId}.mp3`);

  try {
    console.log(`WAVファイル保存開始: ${wavFilePath}`);
    fs.writeFileSync(wavFilePath, audioBuffer);
    console.log(`WAVファイル保存完了: ${wavFilePath}`);

    console.log(`MP3変換開始: ${wavFilePath} -> ${mp3FilePath}`);
    // Fall back to an `ffmpeg` on PATH when ffmpeg-static provides no binary.
    const ffmpegCmd = ffmpegPath || "ffmpeg";
    const result = Bun.spawnSync({
      cmd: [
        ffmpegCmd,
        "-i",
        wavFilePath,
        "-codec:a",
        "libmp3lame",
        "-qscale:a",
        "2",
        "-y", // Overwrite output file
        mp3FilePath,
      ],
    });
    if (result.exitCode !== 0) {
      const stderr = result.stderr
        ? new TextDecoder().decode(result.stderr)
        : "Unknown error";
      throw new Error(`FFmpeg conversion failed: ${stderr}`);
    }
  } finally {
    // Remove the intermediate WAV file on success AND on failure, so failed
    // conversions do not accumulate large temporary files. `force: true`
    // makes a missing file a no-op.
    fs.rmSync(wavFilePath, { force: true });
  }

  console.log(`TTS生成完了: ${itemId}`);
  return path.basename(mp3FilePath);
}
/**
 * Generate TTS audio for an item, scheduling a retry when generation fails.
 *
 * Delegates to `generateTTSWithoutQueue`. If that call throws, the failure is
 * logged; while `retryCount` is below the retry limit the item is handed to
 * `addToQueue` before an error is rethrown. Once the limit is reached, an
 * error is thrown without queueing.
 *
 * @param itemId - Identifier of the item to synthesize.
 * @param scriptText - Text to synthesize.
 * @param retryCount - Zero-based attempt counter for this item.
 * @returns The value resolved by `generateTTSWithoutQueue` on success.
 * @throws Error whenever generation fails; the message states whether the
 *   item was added to the retry queue or the attempts were exhausted.
 */
export async function generateTTS(
  itemId: string,
  scriptText: string,
  retryCount: number = 0,
): Promise<string> {
  const maxRetries = 2;

  try {
    const mp3FileName = await generateTTSWithoutQueue(
      itemId,
      scriptText,
      retryCount,
    );
    return mp3FileName;
  } catch (error) {
    console.error(
      `TTS生成エラー: ${itemId} (試行回数: ${retryCount + 1})`,
      error,
    );

    // Retries exhausted: give up without touching the queue.
    const canRetry = retryCount < maxRetries;
    if (!canRetry) {
      throw new Error(
        `TTS generation failed after ${maxRetries + 1} attempts: ${error}`,
      );
    }

    // Add to queue for retry; the database module is loaded lazily here.
    const database = await import("../services/database.js");
    await database.addToQueue(itemId, scriptText, retryCount);
    throw new Error(`TTS generation failed, added to retry queue: ${error}`);
  }
}