Small additions to Dutch OCRFixReplaceList.xml

Third attempt, thanks to xylographe; hopefully fine-tuned now.
This commit is contained in:
Betsy25 2015-08-07 03:57:01 +02:00
parent 18df8da37d
commit 551ac1a172

View File

@ -6,14 +6,6 @@
<Word from="ledereen" to="Iedereen" />
<Word from="ledere" to="Iedere" />
<Word from="lemand" to="Iemand" />
<Word from="lsolement" to="Isolement" />
<Word from="ler" to="Ier" />
<Word from="lerland" to="Ierland" />
<Word from="lers" to="Iers" />
<Word from="lerse" to="Ierse" />
<Word from="eIk" to="elk" />
<Word from="eIkaar" to="elkaar" />
<Word from="eIke" to="elke" />
</WholeWords>
<PartialWordsAlways />
<PartialWords />
@ -23,6 +15,12 @@
<EndLines />
<WholeLines />
<RegularExpressions>
<!-- Regex-based OCR fixes for Dutch: each rule rewrites a lowercase "l" that stands where a capital "I" belongs, or the reverse in the "eIk" rule. -->
<!-- A word-initial "lk", "ln" or "ls" followed by at least two lowercase letters becomes "Ik", "In" or "Is". The lookahead only checks the following letters; it does not consume or replace them. -->
<RegEx find="\blk(?=\p{Ll}{2})" replaceWith="Ik" />
<RegEx find="\bln(?=\p{Ll}{2})" replaceWith="In" />
<RegEx find="\bls(?=\p{Ll}{2})" replaceWith="Is" />
<!-- A word-initial "eIk" (capital I) becomes "elk". There is no trailing word boundary, so longer words such as "eIkaar" and "eIke" are fixed by the same rule. -->
<RegEx find="\beIk" replaceWith="elk" />
<!-- A word-initial "lsol" becomes "Isol" (for example "lsolement"). NOTE(review): under case-sensitive matching, every text this pattern matches is also matched by the "ls" rule above, so this rule looks redundant. Confirm against the consuming program before removing it. -->
<RegEx find="\blsol" replaceWith="Isol" />
<!-- The standalone word "ler" becomes "Ier". -->
<RegEx find="\bler\b" replaceWith="Ier" />
<!-- The whole words "lerland", "lerse" and "lers" become "Ierland", "Ierse" and "Iers". The $1 in replaceWith presumably re-inserts the captured suffix; this assumes the consuming regex engine uses the usual numbered-group substitution syntax. -->
<RegEx find="\bler(land|se|s)\b" replaceWith="Ier$1" />
</RegularExpressions>
</OCRFixReplaceList>