typography/php-typography/lang/fi.php

396 lines
8.4 KiB
PHP

<?php
/*
Project: PHP Typography
Project URI: http://kingdesk.com/projects/php-typography/
File modified to place pattern and exceptions in arrays that can be understood in php files.
This file is released under the same copyright as the below referenced original file
Original unmodified file is available at: http://mirror.unl.edu/ctan/language/hyph-utf8/tex/generic/hyph-utf8/patterns/
Original file name: hyph-_______________.tex
//============================================================================================================
ORIGINAL FILE INFO
% This file is part of hyph-utf8 package and resulted from
% semi-manual conversions of hyphenation patterns into UTF-8 in June 2008.
%
% Source: fihyph.tex (yyyy-mm-dd)
% Author: Kauko Saarinen
%
% The above mentioned file should become obsolete,
% and the author of the original file should preferaby modify this file instead.
%
% Modificatios were needed in order to support native UTF-8 engines,
% but functionality (hopefully) didn't change in any way, at least not intentionally.
% This file is no longer stand-alone; at least for 8-bit engines
% you probably want to use loadhyph-foo.tex (which will load this file) instead.
%
% Modifications were done by Jonathan Kew, Mojca Miklavec & Arthur Reutenauer
% with help & support from:
% - Karl Berry, who gave us free hands and all resources
% - Taco Hoekwater, with useful macros
% - Hans Hagen, who did the unicodifisation of patterns already long before
% and helped with testing, suggestions and bug reports
% - Norbert Preining, who tested & integrated patterns into TeX Live
%
% However, the 'copyright/copyleft' owner of patterns remains the original author.
%
% The copyright statement of this file is thus:
%
% Do with this file whatever needs to be done in future for the sake of
% 'a better world' as long as you respect the copyright of original file.
% If you're the original author of patterns or taking over a new revolution,
% plese remove all of the TUG comments & credits that we added here -
% you are the Queen / the King, we are only the servants.
%
% If you want to change this file, rather than uploading directly to CTAN,
% we would be grateful if you could send it to us (http://tug.org/tex-hyphen)
% or ask for credentials for SVN repository and commit it yourself;
% we will then upload the whole 'package' to CTAN.
%
% Before a new 'pattern-revolution' starts,
% please try to follow some guidelines if possible:
%
% - \lccode is *forbidden*, and I really mean it
% - all the patterns should be in UTF-8
% - the only 'allowed' TeX commands in this file are: \patterns, \hyphenation,
% and if you really cannot do without, also \input and \message
% - in particular, please no \catcode or \lccode changes,
% they belong to loadhyph-foo.tex,
% and no \lefthyphenmin and \righthyphenmin,
% they have no influence here and belong elsewhere
% - \begingroup and/or \endinput is not needed
% - feel free to do whatever you want inside comments
%
% We know that TeX is extremely powerful, but give a stupid parser
% at least a chance to read your patterns.
%
% For more unformation see
%
% http://tug.org/tex-hyphen
%
%------------------------------------------------------------------------------
%
% -----> Finnish hyphenation patterns for MLPCTeX <------
% First release January -86 by Kauko Saarinen,
% Computing Centre, University of Jyvaskyla, Finland
%
% Completely rewritten January -88. The new patterns make
% much less mistakes with foreign and compound words.
% The article 'Automatic Hyphenation of Finnish'
% by Professor Fred Karlsson is also referred
% ---------------------------------------------------------
%
% 8th March -89 (vers. 2.2), some vowel triples by Fred Karlsson added.
% 9th January - 95: added \uccode and \lccode by Thomas Esser
%
% ********* Patterns may be freely distributed **********
%
//============================================================================================================
*/
$patgenLanguage = 'Finnish';
$patgenExceptions = array();
$patgenMaxSeg = 7;
$patgen = array(
'begin'=>array(
'ä'=>'02',
'ydin'=>'00021',
'suura'=>'000212'
),
'end'=>array(
'sidea'=>'212000'
),
'all'=>array(
'ba'=>'100',
'be'=>'100',
'bi'=>'100',
'bo'=>'100',
'bu'=>'100',
'by'=>'100',
'da'=>'100',
'de'=>'100',
'di'=>'100',
'do'=>'100',
'du'=>'100',
'dy'=>'100',
'dä'=>'100',
'dö'=>'100',
'fa'=>'100',
'fe'=>'100',
'fi'=>'100',
'fo'=>'100',
'fu'=>'100',
'fy'=>'100',
'ga'=>'100',
'ge'=>'100',
'gi'=>'100',
'go'=>'100',
'gu'=>'100',
'gy'=>'100',
'gä'=>'100',
'gö'=>'100',
'ha'=>'100',
'he'=>'100',
'hi'=>'100',
'ho'=>'100',
'hu'=>'100',
'hy'=>'100',
'hä'=>'100',
'hö'=>'100',
'ja'=>'100',
'je'=>'100',
'ji'=>'100',
'jo'=>'100',
'ju'=>'100',
'jy'=>'100',
'jä'=>'100',
'jö'=>'100',
'ka'=>'100',
'ke'=>'100',
'ki'=>'100',
'ko'=>'100',
'ku'=>'100',
'ky'=>'100',
'kä'=>'100',
'kö'=>'100',
'la'=>'100',
'le'=>'100',
'li'=>'100',
'lo'=>'100',
'lu'=>'100',
'ly'=>'100',
'lä'=>'100',
'lö'=>'100',
'ma'=>'100',
'me'=>'100',
'mi'=>'100',
'mo'=>'100',
'mu'=>'100',
'my'=>'100',
'mä'=>'100',
'mö'=>'100',
'na'=>'100',
'ne'=>'100',
'ni'=>'100',
'no'=>'100',
'nu'=>'100',
'ny'=>'100',
'nä'=>'100',
'nö'=>'100',
'pa'=>'100',
'pe'=>'100',
'pi'=>'100',
'po'=>'100',
'pu'=>'100',
'py'=>'100',
'pä'=>'100',
'pö'=>'100',
'ra'=>'100',
're'=>'100',
'ri'=>'100',
'ro'=>'100',
'ru'=>'100',
'ry'=>'100',
'rä'=>'100',
'rö'=>'100',
'sa'=>'100',
'se'=>'100',
'si'=>'100',
'so'=>'100',
'su'=>'100',
'sy'=>'100',
'sä'=>'100',
'sö'=>'100',
'ta'=>'100',
'te'=>'100',
'ti'=>'100',
'to'=>'100',
'tu'=>'100',
'ty'=>'100',
'tä'=>'100',
'tö'=>'100',
'va'=>'100',
've'=>'100',
'vi'=>'100',
'vo'=>'100',
'vu'=>'100',
'vy'=>'100',
'vä'=>'100',
'vö'=>'100',
'str'=>'1020',
'äy'=>'020',
'ya'=>'012',
'yo'=>'012',
'oy'=>'010',
'öy'=>'020',
'uy'=>'012',
'yu'=>'012',
'öa'=>'032',
'öo'=>'032',
'äa'=>'032',
'äo'=>'032',
'äu'=>'012',
'öu'=>'012',
'aä'=>'010',
'aö'=>'010',
'oä'=>'010',
'oö'=>'010',
'uä'=>'012',
'uö'=>'012',
'ää'=>'020',
'öö'=>'020',
'äö'=>'020',
'öä'=>'020',
'aai'=>'0012',
'aae'=>'0012',
'aao'=>'0012',
'aau'=>'0012',
'eea'=>'0012',
'eei'=>'0012',
'eeu'=>'0012',
'eey'=>'0012',
'iia'=>'0012',
'iie'=>'0012',
'iio'=>'0012',
'uua'=>'0012',
'uue'=>'0012',
'uuo'=>'0012',
'uui'=>'0012',
'eaa'=>'0100',
'iaa'=>'0100',
'oaa'=>'0100',
'uaa'=>'0100',
'uee'=>'0100',
'auu'=>'0100',
'iuu'=>'0100',
'euu'=>'0100',
'ouu'=>'0100',
'ääi'=>'0010',
'ääe'=>'0010',
'ääy'=>'0030',
'iää'=>'0100',
'eää'=>'0100',
'yää'=>'0100',
'iöö'=>'0100',
'aei'=>'0100',
'aoi'=>'0100',
'eai'=>'0100',
'iau'=>'0100',
'yei'=>'0100',
'aia'=>'0010',
'aie'=>'0010',
'aio'=>'0010',
'aiu'=>'0010',
'aua'=>'0010',
'aue'=>'0010',
'eua'=>'0010',
'iea'=>'0010',
'ieo'=>'0010',
'iey'=>'0010',
'ioa'=>'0012',
'ioe'=>'0012',
'iua'=>'0010',
'iue'=>'0010',
'iuo'=>'0010',
'oia'=>'0010',
'oie'=>'0010',
'oio'=>'0010',
'oiu'=>'0010',
'oui'=>'0100',
'oue'=>'0010',
'ouo'=>'0010',
'uea'=>'0010',
'uie'=>'0010',
'uoa'=>'0010',
'uou'=>'0010',
'eö'=>'012',
'öe'=>'012',
'us'=>'020',
'yliop'=>'000120',
'aliav'=>'000120',
'spli'=>'10200',
'alous'=>'000001',
'keus'=>'00001',
'rtaus'=>'000001',
'sohje'=>'210000',
'sasia'=>'212000',
'asian'=>'120000',
'asiat'=>'120000',
'asioi'=>'120000',
'ras'=>'0200',
'las'=>'0200',
'sopisk'=>'2120000',
'nopet'=>'212000',
'saloi'=>'212000',
'nopist'=>'2120000',
'sopist'=>'2120000',
'sosa'=>'21200',
'nosa'=>'21200',
'alkeis'=>'0000021',
'perus'=>'000001',
'sidean'=>'2120000',
'sesity'=>'2120000',
'nedus'=>'212000',
'sajatu'=>'2100000',
'sase'=>'21000',
'sapu'=>'21000',
'syrit'=>'212000',
'syhti'=>'212000',
'notto'=>'210000',
'noton'=>'210000',
'nanto'=>'210000',
'nanno'=>'210000',
'najan'=>'212000',
'naika'=>'210000',
'nomai'=>'212000',
'nylit'=>'212000',
'salen'=>'212000',
'nalen'=>'212000',
'asiakas'=>'12000021',
'ulos'=>'00021',
'najo'=>'21200',
'sajo'=>'21200',
'bl'=>'020',
'blo'=>'1200',
'bibli'=>'000300',
'br'=>'020',
'bri'=>'1200',
'bro'=>'1200',
'bru'=>'1200',
'dr'=>'020',
'dra'=>'1200',
'fl'=>'020',
'fla'=>'1200',
'fr'=>'020',
'fra'=>'1200',
'fre'=>'1200',
'gl'=>'020',
'glo'=>'1200',
'gr'=>'020',
'gra'=>'1200',
'kl'=>'020',
'kra'=>'1200',
'kre'=>'1200',
'kri'=>'1200',
'kv'=>'120',
'kva'=>'1200',
'pl'=>'020',
'pr'=>'020',
'pro'=>'1200',
'cl'=>'020',
'qv'=>'020',
'qvi'=>'1200',
'sch'=>'0020',
'tsh'=>'0020',
'chr'=>'0020'
)
);
?>