[OcrEngine] - Initialize the name hash sets in a single pass.

This commit is contained in:
Ivandro Ismael 2016-09-07 03:00:22 +01:00
parent ce0f2fdd37
commit df72c62c57
No known key found for this signature in database
GPG Key ID: A8832757DEFB7EDC

View File

@ -208,33 +208,27 @@ namespace Nikse.SubtitleEdit.Logic.Ocr
_namesEtcList = _namesList.GetNames(); _namesEtcList = _namesList.GetNames();
_namesEtcMultiWordList = _namesList.GetMultiNames(); _namesEtcMultiWordList = _namesList.GetMultiNames();
_namesEtcListUppercase = new HashSet<string>(); _namesEtcListUppercase = new HashSet<string>();
foreach (string name in _namesEtcList)
_namesEtcListUppercase.Add(name.ToUpper());
_namesEtcListWithApostrophe = new HashSet<string>(); _namesEtcListWithApostrophe = new HashSet<string>();
if (threeLetterIsoLanguageName.Equals("eng", StringComparison.OrdinalIgnoreCase))
{
foreach (string namesItem in _namesEtcList)
{
if (!namesItem.EndsWith('s'))
_namesEtcListWithApostrophe.Add(namesItem + "'s");
else
_namesEtcListWithApostrophe.Add(namesItem + "'");
}
}
// Load user words
_userWordList = new HashSet<string>();
_userWordListXmlFileName = Utilities.LoadUserWordList(_userWordList, _fiveLetterWordListLanguageName);
// Find abbreviations
_abbreviationList = new HashSet<string>(); _abbreviationList = new HashSet<string>();
bool isEnglish = threeLetterIsoLanguageName.Equals("eng", StringComparison.OrdinalIgnoreCase);
foreach (string name in _namesEtcList) foreach (string name in _namesEtcList)
{ {
_namesEtcListUppercase.Add(name.ToUpper());
if (isEnglish)
{
if (!name.EndsWith('s'))
_namesEtcListWithApostrophe.Add(name + "'s");
else
_namesEtcListWithApostrophe.Add(name + "'");
}
// Abbreviations.
if (name.EndsWith('.')) if (name.EndsWith('.'))
{
_abbreviationList.Add(name); _abbreviationList.Add(name);
} }
if (threeLetterIsoLanguageName.Equals("eng", StringComparison.OrdinalIgnoreCase)) }
if (isEnglish)
{ {
if (!_abbreviationList.Contains("a.m.")) if (!_abbreviationList.Contains("a.m."))
_abbreviationList.Add("a.m."); _abbreviationList.Add("a.m.");
@ -243,7 +237,9 @@ namespace Nikse.SubtitleEdit.Logic.Ocr
if (!_abbreviationList.Contains("o.r.")) if (!_abbreviationList.Contains("o.r."))
_abbreviationList.Add("o.r."); _abbreviationList.Add("o.r.");
} }
// Load user words
_userWordList = new HashSet<string>();
_userWordListXmlFileName = Utilities.LoadUserWordList(_userWordList, _fiveLetterWordListLanguageName);
foreach (string name in _userWordList) foreach (string name in _userWordList)
{ {
if (name.EndsWith('.')) if (name.EndsWith('.'))