From 42511ece3fde6431feb01f0576b153b2aafffefb Mon Sep 17 00:00:00 2001 From: Flammie Pirinen Date: Tue, 24 Jun 2014 16:14:43 +0100 Subject: Add Finnish abbreviations from omorfi --- scripts/share/nonbreaking_prefix.fi | 140 ++++++++++++++++++++++++++++++++++++ 1 file changed, 140 insertions(+) create mode 100644 scripts/share/nonbreaking_prefix.fi diff --git a/scripts/share/nonbreaking_prefix.fi b/scripts/share/nonbreaking_prefix.fi new file mode 100644 index 000000000..be3f66986 --- /dev/null +++ b/scripts/share/nonbreaking_prefix.fi @@ -0,0 +1,140 @@ +#Anything in this file, followed by a period (and an upper-case word), does NOT +#indicate an end-of-sentence marker. Special cases are included for prefixes +#that ONLY appear before 0-9 numbers. + +#This list is compiled from omorfi database +#by Tommi A Pirinen. + + +#any single upper case letter followed by a period is not a sentence ender +#(excluding I occasionally, but we leave it in usually upper case letters are +#initials in a name +A +B +C +D +E +F +G +H +I +J +K +L +M +N +O +P +Q +R +S +T +U +V +W +X +Y +Z +Å +Ä +Ö + +#List of titles. These are often followed by upper-case names, but do not indicate sentence breaks +alik +alil +amir +apul +apul.prof +arkkit +ass +assist +dipl +dipl.arkkit +dipl.ekon +dipl.ins +dipl.kielenk +dipl.kirjeenv +dipl.kosm +dipl.urk +dos +erikoiseläinl +erikoishammasl +erikoisl +erikoist +ev.luutn +evp +fil +ft +hallinton +hallintot +hammaslääket +jatk +jääk +kansaned +kapt +kapt.luutn +kenr +kenr.luutn +kenr.maj +kers +kirjeenv +kom +kom.kapt +komm +konst +korpr +luutn +maist +maj +Mr +Mrs +Ms +M.Sc +neuv +nimim +Ph.D +prof +puh.joht +pääll +res +san +siht +suom +sähköp +säv +toht +toim +toim.apul +toim.joht +toim.siht +tuom +ups +vänr +vääp +ye.ups +ylik +ylil +ylim +ylimatr +yliop +yliopp +ylip +yliv + +#misc - odd period-ending items that NEVER indicate breaks (p.m. does NOT fall +#into this category - it sometimes ends a sentence) +e.g +ent +esim +huom +i.e +ilm +l +mm +myöh +nk +nyk +par +po +t +v -- cgit v1.2.3 From 1da3df93bcd7e115d9bfe78888dc71460a544cc0 Mon Sep 17 00:00:00 2001 From: Flammie Pirinen Date: Thu, 4 Sep 2014 16:01:10 +0100 Subject: fix location and remove english notes --- scripts/share/nonbreaking_prefix.fi | 140 --------------------- .../nonbreaking_prefixes/nonbreaking_prefix.fi | 138 ++++++++++++++++++++ 2 files changed, 138 insertions(+), 140 deletions(-) delete mode 100644 scripts/share/nonbreaking_prefix.fi create mode 100644 scripts/share/nonbreaking_prefixes/nonbreaking_prefix.fi diff --git a/scripts/share/nonbreaking_prefix.fi b/scripts/share/nonbreaking_prefix.fi deleted file mode 100644 index be3f66986..000000000 --- a/scripts/share/nonbreaking_prefix.fi +++ /dev/null @@ -1,140 +0,0 @@ -#Anything in this file, followed by a period (and an upper-case word), does NOT -#indicate an end-of-sentence marker. Special cases are included for prefixes -#that ONLY appear before 0-9 numbers. - -#This list is compiled from omorfi database -#by Tommi A Pirinen. - - -#any single upper case letter followed by a period is not a sentence ender -#(excluding I occasionally, but we leave it in usually upper case letters are -#initials in a name -A -B -C -D -E -F -G -H -I -J -K -L -M -N -O -P -Q -R -S -T -U -V -W -X -Y -Z -Å -Ä -Ö - -#List of titles. These are often followed by upper-case names, but do not indicate sentence breaks -alik -alil -amir -apul -apul.prof -arkkit -ass -assist -dipl -dipl.arkkit -dipl.ekon -dipl.ins -dipl.kielenk -dipl.kirjeenv -dipl.kosm -dipl.urk -dos -erikoiseläinl -erikoishammasl -erikoisl -erikoist -ev.luutn -evp -fil -ft -hallinton -hallintot -hammaslääket -jatk -jääk -kansaned -kapt -kapt.luutn -kenr -kenr.luutn -kenr.maj -kers -kirjeenv -kom -kom.kapt -komm -konst -korpr -luutn -maist -maj -Mr -Mrs -Ms -M.Sc -neuv -nimim -Ph.D -prof -puh.joht -pääll -res -san -siht -suom -sähköp -säv -toht -toim -toim.apul -toim.joht -toim.siht -tuom -ups -vänr -vääp -ye.ups -ylik -ylil -ylim -ylimatr -yliop -yliopp -ylip -yliv - -#misc - odd period-ending items that NEVER indicate breaks (p.m. does NOT fall -#into this category - it sometimes ends a sentence) -e.g -ent -esim -huom -i.e -ilm -l -mm -myöh -nk -nyk -par -po -t -v diff --git a/scripts/share/nonbreaking_prefixes/nonbreaking_prefix.fi b/scripts/share/nonbreaking_prefixes/nonbreaking_prefix.fi new file mode 100644 index 000000000..466c6a837 --- /dev/null +++ b/scripts/share/nonbreaking_prefixes/nonbreaking_prefix.fi @@ -0,0 +1,138 @@ +#Anything in this file, followed by a period (and an upper-case word), does NOT +#indicate an end-of-sentence marker. Special cases are included for prefixes +#that ONLY appear before 0-9 numbers. + +#This list is compiled from omorfi database +#by Tommi A Pirinen. + + +#any single upper case letter followed by a period is not a sentence ender +A +B +C +D +E +F +G +H +I +J +K +L +M +N +O +P +Q +R +S +T +U +V +W +X +Y +Z +Å +Ä +Ö + +#List of titles. These are often followed by upper-case names, but do not indicate sentence breaks +alik +alil +amir +apul +apul.prof +arkkit +ass +assist +dipl +dipl.arkkit +dipl.ekon +dipl.ins +dipl.kielenk +dipl.kirjeenv +dipl.kosm +dipl.urk +dos +erikoiseläinl +erikoishammasl +erikoisl +erikoist +ev.luutn +evp +fil +ft +hallinton +hallintot +hammaslääket +jatk +jääk +kansaned +kapt +kapt.luutn +kenr +kenr.luutn +kenr.maj +kers +kirjeenv +kom +kom.kapt +komm +konst +korpr +luutn +maist +maj +Mr +Mrs +Ms +M.Sc +neuv +nimim +Ph.D +prof +puh.joht +pääll +res +san +siht +suom +sähköp +säv +toht +toim +toim.apul +toim.joht +toim.siht +tuom +ups +vänr +vääp +ye.ups +ylik +ylil +ylim +ylimatr +yliop +yliopp +ylip +yliv + +#misc - odd period-ending items that NEVER indicate breaks (p.m. does NOT fall +#into this category - it sometimes ends a sentence) +e.g +ent +esim +huom +i.e +ilm +l +mm +myöh +nk +nyk +par +po +t +v -- cgit v1.2.3