Update hrv_OCRFixReplaceList.xml

This commit is contained in:
May Kittens Devour Your Soul 2022-01-26 13:34:46 +01:00 committed by GitHub
parent e0bfd5fe8d
commit 7d2600831f
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

View File

@ -2,6 +2,7 @@
<OCRFixReplaceList>
<WholeWords>
<Word from="()d" to="Od" />
<Word from="ae" to="se" />
<Word from="aam" to="sam" />
<Word from="advokati" to="odvjetnici" />
<Word from="Advokati" to="Odvjetnici" />
@ -16,6 +17,7 @@
<Word from="Ajpodu" to="iPodu" />
<Word from="akcenat" to="naglasak" />
<Word from="aki" to="ali" />
<Word from="akp" to="ako" />
<Word from="akcionara" to="dioničara" />
<Word from="aktuelan" to="aktualan" />
<Word from="akvarijum" to="akvarij" />
@ -99,11 +101,13 @@
<Word from="braon" to="smeđa" />
<Word from="bregu" to="brijegu" />
<Word from="bti" to="biti" />
<Word from="budr" to="bude" />
<Word from="buđav" to="pljesniv" />
<Word from="cedila" to="cijedila" />
<Word from="cedilu" to="cjedilu" />
<Word from="cenzurisan" to="cenzuriran" />
<Word from="cenzurisana" to="cenzurirana" />
<Word from="cenzurišeš" to="cenzuriraš" />
<Word from="ceo" to="cijeli" />
<Word from="Ceo" to="Cijeli" />
<Word from="cepa" to="cijepa" />
@ -264,6 +268,7 @@
<Word from="dobijao" to="dobivao" />
<Word from="dobijati" to="dobivati" />
<Word from="doči" to="doći" />
<Word from="dode" to="dođe" />
<Word from="dodju" to="dođu" />
<Word from="dole" to="dolje" />
<Word from="Dole" to="Dolje" />
@ -275,6 +280,7 @@
<!-- nije za regex [ni dospeo - ni dospeju - mora ostati ovako] -->
<Word from="dospeo" to="dospio" />
<Word from="dospeju" to="dospiju" />
<Word from="doše" to="dođe" />
<Word from="dođavola" to="dovraga" />
<Word from="Dođavola" to="Dovraga" />
<Word from="dotera" to="dotjera" />
@ -431,6 +437,7 @@
<Word from="Iči" to="Ići" />
<Word from="iduči" to="idući" />
<Word from="iko" to="itko" />
<Word from="imq" to="ima" />
<Word from="imap" to="imao" />
<Word from="imamp" to="imamo" />
<Word from="ignoriši" to="ignoriraj" />
@ -467,6 +474,8 @@
<Word from="istrebiti" to="istrijebiti" />
<Word from="isuviše" to="previše" />
<Word from="iščupaću" to="iščupat ću" />
<Word from="iszom" to="istom" />
<Word from="ive" to="ove" />
<Word from="ivica" to="rub" />
<Word from="ivice" to="ruba" />
<Word from="ivici" to="rubu" />
@ -788,7 +797,8 @@
<Word from="matorom" to="starom" />
<Word from="mego" to="nego" />
<Word from="mehur" to="mjehur" />
<Word from="menom" to="mnom" />
<Word from="menom" to="mnom" />
<Word from="menjanja" to="mijenjanja" />
<Word from="menr" to="mene" />
<Word from="menjajući" to="mijenjajući" />
<Word from="merač" to="mjerač" />
@ -830,6 +840,8 @@
<Word from="Muzika" to="Glazba" />
<Word from="Muzike" to="Glazbe" />
<Word from="Muzikom" to="Glazbom" />
<Word from="Nr" to="Ne" />
<Word from="nr" to="ne" />
<Word from="ns" to="na" />
<Word from="nači" to="naći" />
<Word from="nadevati" to="nadijevati" />
@ -964,6 +976,7 @@
<Word from="Obe" to="Obje" />
<Word from="obema" to="objema" />
<Word from="obezbede" to="osiguraju" />
<Word from="obezbediću" to="osigurat ću" />
<Word from="Obezbeđuju" to="Osiguravaju" />
<Word from="obezbeđuju" to="osiguravaju" />
<Word from="objekat" to="objekt" />
@ -1316,6 +1329,7 @@
<Word from="Prijatan" to="Ugodan" />
<Word from="prijw" to="prije" />
<Word from="primećivao" to="primjećivao" />
<Word from="primećivala" to="primjećivala" />
<Word from="primedbi" to="primjedbi" />
<Word from="primjete" to="primijete" />
<Word from="prisetim" to="prisjetim" />
@ -1472,6 +1486,7 @@
<Word from="sečivo" to="sječivo" />
<Word from="sečiva" to="sječiva" />
<Word from="sedećeš" to="sjedit ćeš" />
<Word from="sedeo" to="sjedio" />
<Word from="sedeli" to="sjedili" />
<Word from="sedišta" to="sjedala" />
<Word from="sedište" to="sjedalo" />
@ -1674,6 +1689,7 @@
<Word from="Stideo" to="Stidio" />
<Word from="stidela" to="stidjela" />
<Word from="stiditi" to="stidjeti" />
<Word from="stim" to="s tim" />
<Word from="stovri" to="stvori" />
<Word from="streljamo" to="strijeljamo" />
<Word from="streljati" to="strijeljati" />
@ -1704,6 +1720,7 @@
<Word from="Supu" to="Juhu" />
<Word from="Supom" to="Juhom" />
<Word from="Supama" to="Juhama" />
<Word from="supet" to="super" />
<Word from="surfovat" to="surfat" />
<Word from="surfovati" to="surfati" />
<Word from="surfuje" to="surfa" />
@ -1733,6 +1750,7 @@
<Word from="Suvu" to="Suhu" />
<Word from="Svestan" to="Svjestan" />
<Word from="svestan" to="svjestan" />
<Word from="svida" to="sviđa" />
<Word from="svidja" to="sviđa" />
<Word from="svjest" to="svijest" />
<Word from="Svjest" to="Svijest" />
@ -2092,6 +2110,7 @@
<Word from="zasede" to="zasjede" />
<Word from="zasedi" to="zasjedi" />
<Word from="zasedu" to="zasjedu" />
<Word from="zaslepi" to="zaslijepi" />
<Word from="zastideo" to="zastidio" />
<Word from="zatp" to="zato" />
<Word from="Zatp" to="Zato" />
@ -3162,6 +3181,7 @@
<RegEx find="(?&lt;![mn])o(d?)se([kć])(?!s)" replaceWith="o$1sje$2" />
<RegEx find="odu?hvat" replaceWith="othvat" />
<RegEx find="(?&lt;!r)oent" replaceWith="oant" />
<RegEx find="oljnj" replaceWith="onj" />
<RegEx find="ovatn" replaceWith="ojatn" />
<RegEx find="overn" replaceWith="ovjern" />
<RegEx find="ovren" replaceWith="ovoren" />
@ -3589,6 +3609,7 @@
<RegEx find="begl" replaceWith="bjegl" />
<RegEx find="bmi" replaceWith="bni" />
<RegEx find="bpl" replaceWith="bol" />
<RegEx find="bsl" replaceWith="bal" />
<RegEx find="bs([to])" replaceWith="ps$1" />
<RegEx find="iliše" replaceWith="ilizira" />
<RegEx find="ilišu" replaceWith="iliziraju" />
@ -3603,15 +3624,17 @@
<RegEx find="cjenil" replaceWith="cijenil" />
<RegEx find="coje" replaceWith="cije" />
<RegEx find="ćnot" replaceWith="ćnost" />
<RegEx find="čmos" replaceWith="čnos" />
<RegEx find="diba" replaceWith="dina" />
<RegEx find="dišl" replaceWith="dišn" />
<RegEx find="dks" replaceWith="dsk" />
<RegEx find="dnačin" replaceWith="dnadžb" />
<RegEx find="dnp" replaceWith="dno" />
<RegEx find="dps" replaceWith="dos" />
<RegEx find="dps" replaceWith="dos" />
<RegEx find="domač" replaceWith="domać" />
<RegEx find="\bdral" replaceWith="deral" />
<RegEx find="dranj" replaceWith="deranj" />
<RegEx find="dqj" replaceWith="daj" />
<RegEx find="dsek" replaceWith="dsjek" />
<RegEx find="[dt]cj?en(i|jen)" replaceWith="dcijen$1" />
<RegEx find="(?&lt;![dt])cj?enim" replaceWith="cijenim" />
@ -3640,6 +3663,7 @@
<RegEx find="esvest" replaceWith="esvijest" />
<RegEx find="etektov" replaceWith="etektir" />
<RegEx find="evać" replaceWith="evat ć" />
<RegEx find="ezk" replaceWith="etk" />
<RegEx find="fanziv" replaceWith="fenziv" />
<RegEx find="fejs" replaceWith="face" />
<RegEx find="figurisa" replaceWith="figurira" />
@ -3653,6 +3677,8 @@
<RegEx find="frov" replaceWith="frir" />
<RegEx find="gačuj" replaceWith="gaćuj" />
<RegEx find="glda" replaceWith="gleda" />
<RegEx find="gpd" replaceWith="god" />
<RegEx find="gpt" replaceWith="got" />
<RegEx find="grišć" replaceWith="grist ć" />
<RegEx find="(?&lt;!e)grš" replaceWith="greš" />
<RegEx find="grutova" replaceWith="grutira" />
@ -3695,14 +3721,17 @@
<RegEx find="ledov" replaceWith="ljedov" />
<RegEx find="lj?epić" replaceWith="lijepit ć" />
<RegEx find="lepš" replaceWith="ljepš" />
<RegEx find="lkm" replaceWith="lim" />
<RegEx find="ljubc" replaceWith="ljupc" />
<RegEx find="ljutić" replaceWith="ljutit ć" />
<RegEx find="lpg" replaceWith="log" />
<RegEx find="lrd" replaceWith="led" />
<RegEx find="lša" replaceWith="iša" />
<RegEx find="Lša" replaceWith="Iša" />
<RegEx find="ltovan" replaceWith="ltiran" />
<RegEx find="l([ou])žić" replaceWith="l$1žit ć" />
<RegEx find="luparenj" replaceWith="lupiranj" />
<RegEx find="lwn" replaceWith="lan" />
<RegEx find="mbog" replaceWith="mnog" />
<RegEx find="(?&lt;![Mm])ekd" replaceWith="egd" />
<RegEx find="([mv])ešten" replaceWith="$1ješten" />
@ -3721,6 +3750,7 @@
<RegEx find="nimp" replaceWith="nimo" />
<RegEx find="(?&lt;!a)nks" replaceWith="nsk" />
<RegEx find="ngažuj" replaceWith="ngažiraj" />
<RegEx find="nkm" replaceWith="nom" />
<RegEx find="nho" replaceWith="nko" />
<RegEx find="nisa([nlot])" replaceWith="nira$1" />
<RegEx find="(?&lt;!am)nesti" replaceWith="nijeti" />
@ -3742,6 +3772,7 @@
<RegEx find="ntišu" replaceWith="ntiraju" />
<RegEx find="ntitj?el" replaceWith="ntitijel" />
<RegEx find="ntv" replaceWith="nstv" />
<RegEx find="nwt" replaceWith="net" />
<RegEx find="nwz" replaceWith="nez" />
<RegEx find="nzuje" replaceWith="nzira" />
<RegEx find="atursk" replaceWith="aturaln" />
@ -3805,6 +3836,7 @@
<RegEx find="pulis" replaceWith="pulir" />
<RegEx find="pva" replaceWith="ova" />
<RegEx find="pzn" replaceWith="pozn" />
<RegEx find="rdk" replaceWith="rek" />
<RegEx find="riaj" replaceWith="rija" />
<RegEx find="rićemo" replaceWith="rit ćemo" />
<RegEx find="rčaće" replaceWith="rčat će" />
@ -3816,6 +3848,7 @@
<RegEx find="(?&lt;!r)ojd" replaceWith="ojed" />
<RegEx find="rpeu" replaceWith="preu" />
<RegEx find="rqm" replaceWith="ram" />
<RegEx find="rqt" replaceWith="rat" />
<RegEx find="([rv])pd" replaceWith="$1od" />
<RegEx find="rsd" replaceWith="rad" />
<RegEx find="rsv" replaceWith="rav" />
@ -3911,6 +3944,7 @@
<RegEx find="vetr" replaceWith="vjetr" />
<RegEx find="visić" replaceWith="visit ć" />
<RegEx find="visa([lt])" replaceWith="vira$1" />
<RegEx find="vkr" replaceWith="vor" />
<RegEx find="([vV])jeov" replaceWith="$1jerov" />
<RegEx find="vješč" replaceWith="vješć" />
<RegEx find="vljstv" replaceWith="voljstv" />
@ -3919,6 +3953,7 @@
<RegEx find="vld" replaceWith="vlad" />
<RegEx find="vnr" replaceWith="vne" />
<RegEx find="vnsk" replaceWith="vinsk" />
<RegEx find="voei" replaceWith="vori" />
<RegEx find="(?&lt;!d)vof" replaceWith="vog" />
<RegEx find="vpj" replaceWith="voj" />
<RegEx find="vpm" replaceWith="vom" />
@ -3937,6 +3972,7 @@
<RegEx find="zpr" replaceWith="spr" />
<RegEx find="zsp" replaceWith="zap" />
<RegEx find="zsn" replaceWith="zan" />
<RegEx find="zqp" replaceWith="zap" />
<RegEx find="zuslov" replaceWith="zuvjet" />
<RegEx find="zvešć" replaceWith="zvest ć" />
<RegEx find="zvolić" replaceWith="zvolit ć" />
@ -3949,6 +3985,7 @@
<RegEx find="Afghanistan" replaceWith="Afganistan" />
<RegEx find="Ajdah" replaceWith="Idah" />
<RegEx find="Ajl[ae]nd" replaceWith="Island" />
<RegEx find="Ajvs" replaceWith="Yves" />
<RegEx find="Ajzak" replaceWith="Isaac" />
<RegEx find="Ajzenhauer" replaceWith="Eisenhower" />
<RegEx find="([aA])l[cz]h[ae]jmer" replaceWith="$1lzheimer" />
@ -4006,6 +4043,7 @@
<RegEx find="\bĐovani" replaceWith="Giovanni" />
<RegEx find="Hari" replaceWith="Harry" />
<RegEx find="Hauard" replaceWith="Howard" />
<RegEx find="Hemtons" replaceWith="Hamptons" />
<RegEx find="Hitrou" replaceWith="Heathrow" />
<RegEx find="Hrist" replaceWith="Krist" />
<RegEx find="Holandij" replaceWith="Nizozemsk" />
@ -4048,6 +4086,7 @@
<RegEx find="Metju" replaceWith="Matthew" />
<RegEx find="Mexic" replaceWith="Meksik" />
<RegEx find="ičigen" replaceWith="ichigan" />
<RegEx find="Misuri" replaceWith="Missouri" />
<RegEx find="Misisipi" replaceWith="Mississippi" />
<RegEx find="Mocart" replaceWith="Mozart" />
<RegEx find="Nejt" replaceWith="Nate" />