Added Lithuanian language auto-detection

This commit is contained in:
Nikolaj Olsson 2016-11-19 22:30:47 +01:00
parent 5511d2df9e
commit e7b5e6e66f

View File

@ -135,6 +135,7 @@ namespace Nikse.SubtitleEdit.Core
"[Aa]?[Ll]ebo", "[Pp]ri", "[Pp]re", "([Íí]sť|[Ii](?:dem|de|deme|dú))", "[Pp]red.*", "[Mm]edzi", "[Ee]šte", "[Čč]lovek", "[Pp]odľa", "[Ďď]alš(í|ia|ie)" };
private static readonly string[] AutoDetectWordsLatvian = { "Paldies", "neesmu ", "nezinu", "viòð", "viņš", "viņu", "kungs", "esmu", "Viņš", "Velns", "viņa", "dievs", "Pagaidi", "varonis", "agrāk", "varbūt" };
private static readonly string[] AutoDetectWordsLithuanian = { "tavęs", "veidai", "apie", "jums", "Veidai", "Kaip", "kaip", "reikia", "Šūdas", "frensis", "Ačiū", "vilsonai", "Palauk", "Veidas", "viskas", "Tikrai", "manęs", "Tačiau", "žmogau", "Flagai", "Prašau", "Džiune", "Nakties", "šviesybe" };
private static string AutoDetectGoogleLanguage(string text, int bestCount)
{
@ -298,6 +299,9 @@ namespace Nikse.SubtitleEdit.Core
count = GetCount(text, AutoDetectWordsCzechAndSlovak);
if (count > bestCount)
{
var lithuanianCount = GetCount(text, AutoDetectWordsLithuanian);
if (lithuanianCount <= count)
{
int czechWordsCount = GetCount(text, AutoDetectWordsCzech);
int slovakWordsCount = GetCount(text, AutoDetectWordsSlovak);
@ -305,11 +309,16 @@ namespace Nikse.SubtitleEdit.Core
return "cs"; // Czech
return "sk"; // Slovak
}
}
count = GetCount(text, AutoDetectWordsLatvian);
if (count > bestCount * 1.2)
return "lv";
count = GetCount(text, AutoDetectWordsLithuanian);
if (count > bestCount)
return "lt";
return string.Empty;
}
@ -551,7 +560,13 @@ namespace Nikse.SubtitleEdit.Core
case "cs_CZ": // Czech
count = GetCount(text, AutoDetectWordsCzech);
if (count > bestCount)
{
var lithuanianCount = GetCount(text, AutoDetectWordsLithuanian);
if (count > lithuanianCount)
{
languageName = shortName;
}
}
break;
case "sk_SK": // Slovak
count = GetCount(text, AutoDetectWordsSlovak);
@ -563,6 +578,12 @@ namespace Nikse.SubtitleEdit.Core
if (count > bestCount)
languageName = shortName;
break;
case "lt_LT": // Lithuanian
case "lt": // Lithuanian
count = GetCount(text, AutoDetectWordsLithuanian);
if (count > bestCount)
languageName = shortName;
break;
}
}
return languageName;