Work on tts

This commit is contained in:
Nikolaj Olsson 2024-04-13 07:36:17 +02:00
parent c0ed5acc33
commit 3fec01a167

View File

@ -21,6 +21,7 @@ namespace Nikse.SubtitleEdit.Forms.Tts
private string _waveFolder;
private readonly List<ActorAndVoice> _actorAndVoices;
private readonly SubtitleFormat _subtitleFormat;
private bool _abort;
public class ActorAndVoice
{
@ -92,14 +93,39 @@ namespace Nikse.SubtitleEdit.Forms.Tts
private void ButtonGenerateTtsClick(object sender, EventArgs e)
{
if (buttonGenerateTTS.Text == LanguageSettings.Current.General.Cancel)
{
buttonGenerateTTS.Enabled = false;
_abort = true;
Application.DoEvents();
return;
}
buttonGenerateTTS.Text = LanguageSettings.Current.General.Cancel;
_waveFolder = Path.Combine(Path.GetTempPath(), Guid.NewGuid().ToString());
Directory.CreateDirectory(_waveFolder);
GenerateParagraphAudio(_subtitle, true);
GenerateParagraphAudio(_subtitle, true, null);
if (_abort)
{
HandleAbort();
return;
}
var fileNames = FixParagraphAudioSpeed();
if (_abort)
{
HandleAbort();
return;
}
var tempAudioFile = MergeAudioParagraphs(fileNames);
if (_abort)
{
HandleAbort();
return;
}
// rename result file
var resultAudioFileName = Path.Combine(Path.GetDirectoryName(tempAudioFile), Path.GetFileNameWithoutExtension(_videoFileName) + ".wav");
@ -110,28 +136,49 @@ namespace Nikse.SubtitleEdit.Forms.Tts
if (checkBoxAddToVideoFile.Checked)
{
AddAudioToVideoFile(resultAudioFileName);
if (_abort)
{
HandleAbort();
return;
}
}
HandleAbort();
UiUtil.OpenFolder(_waveFolder);
}
private void GenerateParagraphAudio(Subtitle subtitle, bool showProgressBar)
private void HandleAbort()
{
buttonGenerateTTS.Enabled = false;
progressBar1.Visible = false;
labelProgress.Text = string.Empty;
if (_abort)
{
Cleanup(_waveFolder, string.Empty);
}
buttonGenerateTTS.Text = "Generate text to speech";
buttonGenerateTTS.Enabled = true;
_abort = false;
}
private void GenerateParagraphAudio(Subtitle subtitle, bool showProgressBar, string overrideFileName)
{
if (nikseComboBoxEngine.SelectedIndex == 0)
{
GenerateParagraphAudioMs(subtitle, showProgressBar);
GenerateParagraphAudioMs(subtitle, showProgressBar, overrideFileName);
}
else if (nikseComboBoxEngine.SelectedIndex == 1)
{
GenerateParagraphAudioPiperTts(subtitle, showProgressBar);
GenerateParagraphAudioPiperTts(subtitle, showProgressBar, overrideFileName);
}
else if (nikseComboBoxEngine.SelectedIndex == 2)
{
GenerateParagraphAudioTortoiseTts(subtitle, showProgressBar);
GenerateParagraphAudioTortoiseTts(subtitle, showProgressBar, overrideFileName);
}
else if (nikseComboBoxEngine.SelectedIndex == 3)
{
GenerateParagraphAudioMimic3(subtitle, showProgressBar);
GenerateParagraphAudioMimic3(subtitle, showProgressBar, overrideFileName);
}
}
@ -147,7 +194,14 @@ namespace Nikse.SubtitleEdit.Forms.Tts
var outputFileName = Path.Combine(_waveFolder, Path.GetFileNameWithoutExtension(audioFileName) + videoExt);
var addAudioProcess = VideoPreviewGenerator.AddAudioTrack(_videoFileName, audioFileName, outputFileName);
addAudioProcess.Start();
addAudioProcess.WaitForExit();
while (!addAudioProcess.HasExited)
{
Application.DoEvents();
if (_abort)
{
break;
}
}
labelProgress.Text = string.Empty;
}
@ -186,7 +240,13 @@ namespace Nikse.SubtitleEdit.Forms.Tts
var outputFileName1 = Path.Combine(_waveFolder, index + "_u.wav");
var trimProcess = VideoPreviewGenerator.TrimSilenceStartAndEnd(pFileName, outputFileName1);
trimProcess.Start();
trimProcess.WaitForExit();
while (!trimProcess.HasExited)
{
if (_abort)
{
return new List<string>();
}
}
var addDuration = 0d;
if (next != null && p.EndTime.TotalMilliseconds < next.StartTime.TotalMilliseconds)
@ -199,6 +259,11 @@ namespace Nikse.SubtitleEdit.Forms.Tts
}
}
if (_abort)
{
return new List<string>();
}
var waveInfo = UiUtil.GetVideoInfo(outputFileName1);
if (waveInfo.TotalMilliseconds <= p.DurationTotalMilliseconds + addDuration)
{
@ -211,7 +276,15 @@ namespace Nikse.SubtitleEdit.Forms.Tts
fileNames.Add(outputFileName2);
var mergeProcess = VideoPreviewGenerator.ChangeSpeed(outputFileName1, outputFileName2, (float)factor);
mergeProcess.Start();
mergeProcess.WaitForExit();
while (!mergeProcess.HasExited)
{
Application.DoEvents();
if (_abort)
{
return new List<string>();
}
}
}
return fileNames;
@ -248,7 +321,15 @@ namespace Nikse.SubtitleEdit.Forms.Tts
var mergeProcess = VideoPreviewGenerator.MergeAudioTracks(inputFileName, pFileName, outputFileName, (float)p.StartTime.TotalSeconds);
inputFileName = outputFileName;
mergeProcess.Start();
mergeProcess.WaitForExit();
while (!mergeProcess.HasExited)
{
Application.DoEvents();
if (_abort)
{
return string.Empty;
}
}
}
progressBar1.Visible = false;
@ -257,7 +338,7 @@ namespace Nikse.SubtitleEdit.Forms.Tts
return outputFileName;
}
private void GenerateParagraphAudioMs(Subtitle subtitle, bool showProgressBar)
private void GenerateParagraphAudioMs(Subtitle subtitle, bool showProgressBar, string overrideFileName)
{
progressBar1.Value = 0;
progressBar1.Maximum = subtitle.Paragraphs.Count;
@ -286,7 +367,8 @@ namespace Nikse.SubtitleEdit.Forms.Tts
}
var p = subtitle.Paragraphs[index];
synthesizer.SetOutputToWaveFile(Path.Combine(_waveFolder, index + ".wav"));
var wavFileName = Path.Combine(_waveFolder, string.IsNullOrEmpty(overrideFileName) ? index + ".wav" : overrideFileName);
synthesizer.SetOutputToWaveFile(wavFileName);
var builder = new PromptBuilder();
if (voiceInfo != null)
{
@ -322,7 +404,7 @@ namespace Nikse.SubtitleEdit.Forms.Tts
labelProgress.Text = string.Empty;
}
private bool GenerateParagraphAudioPiperTts(Subtitle subtitle, bool showProgressBar)
private bool GenerateParagraphAudioPiperTts(Subtitle subtitle, bool showProgressBar, string overrideFileName)
{
var ttsPath = Path.Combine(Configuration.DataDirectory, "TextToSpeech");
if (!Directory.Exists(ttsPath))
@ -338,7 +420,7 @@ namespace Nikse.SubtitleEdit.Forms.Tts
var piperExe = Path.Combine(piperPath, "piper.exe");
if (!File.Exists(piperExe))
if (Configuration.IsRunningOnWindows && !File.Exists(piperExe))
{
if (MessageBox.Show(string.Format(LanguageSettings.Current.Settings.DownloadX, "Piper Text To Speech"), "Subtitle Edit", MessageBoxButtons.YesNoCancel) != DialogResult.Yes)
{
@ -368,7 +450,7 @@ namespace Nikse.SubtitleEdit.Forms.Tts
}
var p = subtitle.Paragraphs[index];
var outputFileName = Path.Combine(_waveFolder, index + ".wav");
var outputFileName = Path.Combine(_waveFolder, string.IsNullOrEmpty(overrideFileName) ? index + ".wav" : overrideFileName);
if (File.Exists(outputFileName))
{
try
@ -420,7 +502,7 @@ namespace Nikse.SubtitleEdit.Forms.Tts
StartInfo =
{
WorkingDirectory = piperPath,
FileName = piperExe,
FileName = Configuration.IsRunningOnWindows ? piperExe : "piper",
Arguments = $"-m \"{voice.ModelShort}\" -c \"{voice.ConfigShort}\" -f out.wav",
UseShellExecute = false,
CreateNoWindow = true,
@ -433,7 +515,17 @@ namespace Nikse.SubtitleEdit.Forms.Tts
streamWriter.Write(p.Text);
streamWriter.Flush();
streamWriter.Close();
processPiper.WaitForExit();
while (!processPiper.HasExited)
{
Application.DoEvents();
if (_abort)
{
progressBar1.Visible = false;
labelProgress.Text = string.Empty;
return false;
}
}
var inputFile = Path.Combine(piperPath, "out.wav");
File.Move(inputFile, outputFileName);
@ -449,7 +541,7 @@ namespace Nikse.SubtitleEdit.Forms.Tts
return true;
}
private bool GenerateParagraphAudioTortoiseTts(Subtitle subtitle, bool showProgressBar)
private bool GenerateParagraphAudioTortoiseTts(Subtitle subtitle, bool showProgressBar, string overrideFileName)
{
var pythonFolder = Path.Combine(Environment.GetFolderPath(Environment.SpecialFolder.UserProfile),
"AppData",
@ -486,7 +578,7 @@ namespace Nikse.SubtitleEdit.Forms.Tts
}
var p = subtitle.Paragraphs[index];
var outputFileName = Path.Combine(_waveFolder, index + ".wav");
var outputFileName = Path.Combine(_waveFolder, string.IsNullOrEmpty(overrideFileName) ? index + ".wav" : overrideFileName);
var v = voice;
if (_actorAndVoices.Count > 0 && !string.IsNullOrEmpty(p.Actor))
@ -511,7 +603,16 @@ namespace Nikse.SubtitleEdit.Forms.Tts
};
processTortoiseTts.Start();
processTortoiseTts.WaitForExit();
while (!processTortoiseTts.HasExited)
{
Application.DoEvents();
if (_abort)
{
progressBar1.Visible = false;
labelProgress.Text = string.Empty;
return false;
}
}
var inputFile = Path.Combine(_waveFolder, $"{v}_0_2.wav");
File.Move(inputFile, outputFileName);
@ -527,7 +628,7 @@ namespace Nikse.SubtitleEdit.Forms.Tts
return true;
}
private void GenerateParagraphAudioMimic3(Subtitle subtitle, bool showProgressBar)
private void GenerateParagraphAudioMimic3(Subtitle subtitle, bool showProgressBar, string overrideFileName)
{
throw new NotImplementedException();
}
@ -667,8 +768,9 @@ namespace Nikse.SubtitleEdit.Forms.Tts
var text = TextBoxTest.Text;
var sub = new Subtitle();
sub.Paragraphs.Add(new Paragraph(text, 0, 2500));
GenerateParagraphAudio(sub, false);
var waveFileName = Path.Combine(_waveFolder, "0.wav");
var waveFileNameOnly = Guid.NewGuid() + ".wav";
GenerateParagraphAudio(sub, false, waveFileNameOnly);
var waveFileName = Path.Combine(_waveFolder, waveFileNameOnly);
using (var soundPlayer = new System.Media.SoundPlayer(waveFileName))
{
soundPlayer.Play();
@ -692,7 +794,7 @@ namespace Nikse.SubtitleEdit.Forms.Tts
}
finally
{
buttonTestVoice.Enabled = true;
TaskDelayHelper.RunDelayed(TimeSpan.FromSeconds(1), () => buttonTestVoice.Enabled = true);
}
}
}