545 lines
14 KiB
PHP
545 lines
14 KiB
PHP
<?php
|
|
/*
|
|
Project: PHP Typography
|
|
Project URI: http://kingdesk.com/projects/php-typography/
|
|
|
|
File modified to place pattern and exceptions in arrays that can be understood in php files.
|
|
This file is released under the same copyright as the below referenced original file
|
|
Original unmodified file is available at: http://mirror.unl.edu/ctan/language/hyph-utf8/tex/generic/hyph-utf8/patterns/
|
|
Original file name: hyph-la.tex
|
|
|
|
//============================================================================================================
|
|
ORIGINAL FILE INFO
|
|
|
|
% This file is part of hyph-utf8 package and resulted from
|
|
% semi-manual conversions of hyphenation patterns into UTF-8 in June 2008.
|
|
%
|
|
% Source: lahyph.tex (2007-09-03)
|
|
% Author: Claudio Beccari <claudio.beccari at polito.it>
|
|
%
|
|
% The above mentioned file should become obsolete,
|
|
% and the author of the original file should preferaby modify this file instead.
|
|
%
|
|
% Modificatios were needed in order to support native UTF-8 engines,
|
|
% but functionality (hopefully) didn't change in any way, at least not intentionally.
|
|
% This file is no longer stand-alone; at least for 8-bit engines
|
|
% you probably want to use loadhyph-foo.tex (which will load this file) instead.
|
|
%
|
|
% Modifications were done by Jonathan Kew, Mojca Miklavec & Arthur Reutenauer
|
|
% with help & support from:
|
|
% - Karl Berry, who gave us free hands and all resources
|
|
% - Taco Hoekwater, with useful macros
|
|
% - Hans Hagen, who did the unicodifisation of patterns already long before
|
|
% and helped with testing, suggestions and bug reports
|
|
% - Norbert Preining, who tested & integrated patterns into TeX Live
|
|
%
|
|
% However, the 'copyright/copyleft' owner of patterns remains the original author.
|
|
%
|
|
% The copyright statement of this file is thus:
|
|
%
|
|
% Do with this file whatever needs to be done in future for the sake of
|
|
% 'a better world' as long as you respect the copyright of original file.
|
|
% If you're the original author of patterns or taking over a new revolution,
|
|
% plese remove all of the TUG comments & credits that we added here -
|
|
% you are the Queen / the King, we are only the servants.
|
|
%
|
|
% If you want to change this file, rather than uploading directly to CTAN,
|
|
% we would be grateful if you could send it to us (http://tug.org/tex-hyphen)
|
|
% or ask for credentials for SVN repository and commit it yourself;
|
|
% we will then upload the whole 'package' to CTAN.
|
|
%
|
|
% Before a new 'pattern-revolution' starts,
|
|
% please try to follow some guidelines if possible:
|
|
%
|
|
% - \lccode is *forbidden*, and I really mean it
|
|
% - all the patterns should be in UTF-8
|
|
% - the only 'allowed' TeX commands in this file are: \patterns, \hyphenation,
|
|
% and if you really cannot do without, also \input and \message
|
|
% - in particular, please no \catcode or \lccode changes,
|
|
% they belong to loadhyph-foo.tex,
|
|
% and no \lefthyphenmin and \righthyphenmin,
|
|
% they have no influence here and belong elsewhere
|
|
% - \begingroup and/or \endinput is not needed
|
|
% - feel free to do whatever you want inside comments
|
|
%
|
|
% We know that TeX is extremely powerful, but give a stupid parser
|
|
% at least a chance to read your patterns.
|
|
%
|
|
% For more unformation see
|
|
%
|
|
% http://tug.org/tex-hyphen
|
|
%
|
|
%------------------------------------------------------------------------------
|
|
%
|
|
% ********** lahyph.tex *************
|
|
%
|
|
% Copyright 1999- 2001 Claudio Beccari
|
|
% [latin hyphenation patterns]
|
|
%
|
|
% -----------------------------------------------------------------
|
|
% IMPORTANT NOTICE:
|
|
%
|
|
% This program can be redistributed and/or modified under the terms
|
|
% of the LaTeX Project Public License Distributed from CTAN
|
|
% archives in directory macros/latex/base/lppl.txt; either
|
|
% version 1 of the License, or any later version.
|
|
% -----------------------------------------------------------------
|
|
%
|
|
% Patterns for the latin language mainly in modern spelling
|
|
% (u when u is needed and v when v is needed); medieval spelling
|
|
% with the ligatures \ae and \oe and the (uncial) lowercase `v'
|
|
% written as a `u' is also supported; apparently there is no conflict
|
|
% between the patterns of modern Latin and those of medieval Latin.
|
|
%
|
|
% Support for font encoding OT1 with 128-character set and
|
|
% for font encoding T1 with a 256-character set.
|
|
%
|
|
% Prepared by Claudio Beccari
|
|
% Politecnico di Torino
|
|
% Torino, Italy
|
|
% e-mail beccari@polito.it
|
|
%
|
|
% 1999/03/10 Integration of `lahyph7.tex' and `lahyph8.tex' into
|
|
% one file `lahyph.tex' supporting fonts in OT1 and T1 encoding by
|
|
% Bernd Raichle using the macro code from `dehypht.tex' (this code
|
|
% is Copyright 1993,1994,1998,1999 Bernd Raichle/DANTE e.V.).
|
|
%
|
|
%
|
|
% \versionnumber{3.1} \versiondate{2007/04/16}
|
|
%
|
|
% Information after \endinput.
|
|
%
|
|
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
|
|
%
|
|
% \message{Latin Hyphenation Patterns `lahyph' Version 3.1 <2007/04/16>}
|
|
|
|
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
|
|
%
|
|
% For documentation see:
|
|
% C. Beccari, 'Computer aided hyphenation for Italian and Modern
|
|
% Latin', TUG vol. 13, n. 1, pp. 23-33 (1992)
|
|
%
|
|
% see also
|
|
%
|
|
% C. Beccari, 'Typesetting of ancient languages',
|
|
% TUG vol.15, n.1, pp. 9-16 (1994)
|
|
%
|
|
% In the former paper the code was described as being contained in file
|
|
% ITALAT.TEX; this is substantially the same code, but the file has been
|
|
% renamed LAHYPH.TEX in accordance with the ISO name for Latin and the
|
|
% convention that all hyphenation pattern file names should be formed by the
|
|
% agglutination of two letter language ISO code and the abbreviation HYPH.
|
|
%
|
|
% A corresponding file (ITHYPH.TEX) has been extracted in order to eliminate
|
|
% the (few) patterns specific to Latin and leave those specific to Italian;
|
|
% ITHYPH.TEX has been further extended with many new patterns in order to
|
|
% cope with the many neologisms and technical terms with foreign roots.
|
|
%
|
|
% Should you find any word that gets hyphenated in a wrong way, please, AFTER
|
|
% CHECKING ON A RELIABLE MODERN DICTIONARY, report to the author, preferably
|
|
% by e-mail. Please do not report about wrong break points concerning
|
|
% prefixes and/or suffixes; see at the bottom of this file.
|
|
%
|
|
% Compared with the previous versions, this file has been extended so as to
|
|
% cope also with the medieval Latin spelling, where the letter `V' played the
|
|
% roles of both `U' and `V', as in the Roman times, save that the Romans used
|
|
% only capitals. In the middle ages the availability of soft writing supports
|
|
% and the necessity of copying books with a reasonable speed, several scripts
|
|
% evolved in (practically) all of which there was a lower case alphabet
|
|
% different from the upper case one, and where the lower case `v' had the
|
|
% rounded shape of our modern lower case `u', and where the Latin diphthongs
|
|
% `AE' and `OE', both in upper and lower case, where written as ligatures,
|
|
% not to mention the habit of substituting them with their sound, that is a
|
|
% simple `E'.
|
|
%
|
|
% According to Leon Battista Alberti, who in 1466 wrote a book on
|
|
% cryptography where he thoroughly analyzed the hyphenation of the Latin
|
|
% language of his (still medieval) times, the differences from the Tuscan
|
|
% language (the Italian language, as it was named at his time) were very
|
|
% limited, in particular for what concerns the handling of the ascending and
|
|
% descending diphthongs; in Central and Northern Europe, and later on in
|
|
% North America, the Scholars perceived the above diphthongs as made of two
|
|
% distinct vowels; the hyphenation of medieval Latin, therefore, was quite
|
|
% different in the northern countries compared to the southern ones, at least
|
|
% for what concerns these diphthongs. If you need hyphenation patterns for
|
|
% medieval Latin that suite you better according to the habits of Northern
|
|
% Europe you should resort to the hyphenation patterns prepared by Yannis
|
|
% Haralambous (TUGboat, vol.13 n.4 (1992)).
|
|
%
|
|
%
|
|
%
|
|
% PREFIXES AND SUFFIXES
|
|
%
|
|
% For what concerns prefixes and suffixes, the latter are generally separated
|
|
% according to 'natural' syllabification, while the former are generally
|
|
% divided etimologically. In order to avoid an excessive number of patterns,
|
|
% care has been paid to some prefixes, especially 'ex', 'trans', 'circum',
|
|
% 'prae', but this set of patterns is NOT capable of separating the prefixes
|
|
% in all circumstances.
|
|
%
|
|
% BABEL SHORTCUTS AND FACILITIES
|
|
%
|
|
% Read the documentation coming with the discription of the Latin language
|
|
% interface of Babel in order to see the shortcuts and the facilities
|
|
% introduced in order to facilitate the insertion of 'compound word marks'
|
|
% which are very useful for inserting etimological break points.
|
|
%
|
|
% Happy Latin and multilingual typesetting!
|
|
|
|
|
|
//============================================================================================================
|
|
|
|
*/
|
|
|
|
$patgenLanguage = 'Latin';
|
|
|
|
$patgenExceptions = array();
|
|
|
|
$patgenMaxSeg = 7;
|
|
|
|
$patgen = array(
|
|
'begin'=>array(
|
|
'abl'=>'0230',
|
|
'anti'=>'00001',
|
|
'antimn'=>'0000320',
|
|
'circum'=>'0000021',
|
|
'coniun'=>'0021000',
|
|
'discine'=>'00230000',
|
|
'ex'=>'021',
|
|
'ob'=>'023',
|
|
'parai'=>'000010',
|
|
'parau'=>'000010',
|
|
'sublu'=>'002300',
|
|
'subr'=>'00230'
|
|
),
|
|
'end'=>array(
|
|
'sque'=>'23000',
|
|
'sdem'=>'23000',
|
|
'b'=>'20',
|
|
'c'=>'20',
|
|
'd'=>'20',
|
|
'f'=>'20',
|
|
'g'=>'20',
|
|
'h'=>'20',
|
|
'l'=>'20',
|
|
'm'=>'20',
|
|
'n'=>'20',
|
|
'p'=>'20',
|
|
'r'=>'20',
|
|
's'=>'20',
|
|
'st'=>'200',
|
|
't'=>'20',
|
|
'x'=>'20',
|
|
'z'=>'20'
|
|
),
|
|
'all'=>array(
|
|
'\''=>'22',
|
|
'psic'=>'32000',
|
|
'pneu'=>'32000',
|
|
'æ'=>'01',
|
|
'œ'=>'01',
|
|
'aia'=>'0100',
|
|
'aie'=>'0100',
|
|
'aio'=>'0100',
|
|
'aiu'=>'0100',
|
|
'aea'=>'0010',
|
|
'aeo'=>'0010',
|
|
'aeu'=>'0010',
|
|
'eiu'=>'0100',
|
|
'ioi'=>'0010',
|
|
'oia'=>'0100',
|
|
'oie'=>'0100',
|
|
'oio'=>'0100',
|
|
'oiu'=>'0100',
|
|
'uou'=>'0030',
|
|
'b'=>'10',
|
|
'bb'=>'200',
|
|
'bd'=>'200',
|
|
'bl'=>'020',
|
|
'bm'=>'200',
|
|
'bn'=>'200',
|
|
'br'=>'020',
|
|
'bt'=>'200',
|
|
'bs'=>'200',
|
|
'c'=>'10',
|
|
'cc'=>'200',
|
|
'ch'=>'022',
|
|
'cl'=>'020',
|
|
'cm'=>'200',
|
|
'cn'=>'200',
|
|
'cq'=>'200',
|
|
'cr'=>'020',
|
|
'cs'=>'200',
|
|
'ct'=>'200',
|
|
'cz'=>'200',
|
|
'd'=>'10',
|
|
'dd'=>'200',
|
|
'dg'=>'200',
|
|
'dm'=>'200',
|
|
'dr'=>'020',
|
|
'ds'=>'200',
|
|
'dv'=>'200',
|
|
'f'=>'10',
|
|
'ff'=>'200',
|
|
'fl'=>'020',
|
|
'fn'=>'200',
|
|
'fr'=>'020',
|
|
'ft'=>'200',
|
|
'g'=>'10',
|
|
'gg'=>'200',
|
|
'gd'=>'200',
|
|
'gf'=>'200',
|
|
'gl'=>'020',
|
|
'gm'=>'200',
|
|
'gn'=>'020',
|
|
'gr'=>'020',
|
|
'gs'=>'200',
|
|
'gv'=>'200',
|
|
'h'=>'10',
|
|
'hp'=>'200',
|
|
'ht'=>'200',
|
|
'j'=>'10',
|
|
'k'=>'10',
|
|
'kk'=>'200',
|
|
'kh'=>'022',
|
|
'l'=>'10',
|
|
'lb'=>'200',
|
|
'lc'=>'200',
|
|
'ld'=>'200',
|
|
'lf'=>'200',
|
|
'lft'=>'0320',
|
|
'lg'=>'200',
|
|
'lk'=>'200',
|
|
'll'=>'200',
|
|
'lm'=>'200',
|
|
'ln'=>'200',
|
|
'lp'=>'200',
|
|
'lq'=>'200',
|
|
'lr'=>'200',
|
|
'ls'=>'200',
|
|
'lt'=>'200',
|
|
'lv'=>'200',
|
|
'm'=>'10',
|
|
'mm'=>'200',
|
|
'mb'=>'200',
|
|
'mp'=>'200',
|
|
'ml'=>'200',
|
|
'mn'=>'200',
|
|
'mq'=>'200',
|
|
'mr'=>'200',
|
|
'mv'=>'200',
|
|
'n'=>'10',
|
|
'nb'=>'200',
|
|
'nc'=>'200',
|
|
'nd'=>'200',
|
|
'nf'=>'200',
|
|
'ng'=>'200',
|
|
'nl'=>'200',
|
|
'nm'=>'200',
|
|
'nn'=>'200',
|
|
'np'=>'200',
|
|
'nq'=>'200',
|
|
'nr'=>'200',
|
|
'ns'=>'200',
|
|
'nsm'=>'0230',
|
|
'nsf'=>'0230',
|
|
'nt'=>'200',
|
|
'nv'=>'200',
|
|
'nx'=>'200',
|
|
'p'=>'10',
|
|
'ph'=>'020',
|
|
'pl'=>'020',
|
|
'pn'=>'200',
|
|
'pp'=>'200',
|
|
'pr'=>'020',
|
|
'ps'=>'200',
|
|
'pt'=>'200',
|
|
'pz'=>'200',
|
|
'php'=>'2000',
|
|
'pht'=>'2000',
|
|
'qu'=>'102',
|
|
'r'=>'10',
|
|
'rb'=>'200',
|
|
'rc'=>'200',
|
|
'rd'=>'200',
|
|
'rf'=>'200',
|
|
'rg'=>'200',
|
|
'rh'=>'020',
|
|
'rl'=>'200',
|
|
'rm'=>'200',
|
|
'rn'=>'200',
|
|
'rp'=>'200',
|
|
'rq'=>'200',
|
|
'rr'=>'200',
|
|
'rs'=>'200',
|
|
'rt'=>'200',
|
|
'rv'=>'200',
|
|
'rz'=>'200',
|
|
's'=>'12',
|
|
'sph'=>'2300',
|
|
'ss'=>'230',
|
|
'stb'=>'2000',
|
|
'stc'=>'2000',
|
|
'std'=>'2000',
|
|
'stf'=>'2000',
|
|
'stg'=>'2000',
|
|
'stl'=>'2030',
|
|
'stm'=>'2000',
|
|
'stn'=>'2000',
|
|
'stp'=>'2000',
|
|
'stq'=>'2000',
|
|
'sts'=>'2000',
|
|
'stt'=>'2000',
|
|
'stv'=>'2000',
|
|
't'=>'10',
|
|
'tb'=>'200',
|
|
'tc'=>'200',
|
|
'td'=>'200',
|
|
'tf'=>'200',
|
|
'tg'=>'200',
|
|
'th'=>'020',
|
|
'tl'=>'020',
|
|
'tr'=>'020',
|
|
'tm'=>'200',
|
|
'tn'=>'200',
|
|
'tp'=>'200',
|
|
'tq'=>'200',
|
|
'tt'=>'200',
|
|
'tv'=>'200',
|
|
'v'=>'10',
|
|
'vl'=>'020',
|
|
'vr'=>'020',
|
|
'vv'=>'200',
|
|
'x'=>'10',
|
|
'xt'=>'200',
|
|
'xx'=>'200',
|
|
'z'=>'10',
|
|
'aua'=>'0100',
|
|
'aue'=>'0100',
|
|
'aui'=>'0100',
|
|
'auo'=>'0100',
|
|
'auu'=>'0100',
|
|
'eua'=>'0100',
|
|
'eue'=>'0100',
|
|
'eui'=>'0100',
|
|
'euo'=>'0100',
|
|
'euu'=>'0100',
|
|
'iua'=>'0100',
|
|
'iue'=>'0100',
|
|
'iui'=>'0100',
|
|
'iuo'=>'0100',
|
|
'iuu'=>'0100',
|
|
'oua'=>'0100',
|
|
'oue'=>'0100',
|
|
'oui'=>'0100',
|
|
'ouo'=>'0100',
|
|
'ouu'=>'0100',
|
|
'uua'=>'0100',
|
|
'uue'=>'0100',
|
|
'uui'=>'0100',
|
|
'uuo'=>'0100',
|
|
'uuu'=>'0100',
|
|
'alua'=>'02100',
|
|
'alue'=>'02100',
|
|
'alui'=>'02100',
|
|
'aluo'=>'02100',
|
|
'aluu'=>'02100',
|
|
'elua'=>'02100',
|
|
'elue'=>'02100',
|
|
'elui'=>'02100',
|
|
'eluo'=>'02100',
|
|
'eluu'=>'02100',
|
|
'ilua'=>'02100',
|
|
'ilue'=>'02100',
|
|
'ilui'=>'02100',
|
|
'iluo'=>'02100',
|
|
'iluu'=>'02100',
|
|
'olua'=>'02100',
|
|
'olue'=>'02100',
|
|
'olui'=>'02100',
|
|
'oluo'=>'02100',
|
|
'oluu'=>'02100',
|
|
'ulua'=>'02100',
|
|
'ulue'=>'02100',
|
|
'ului'=>'02100',
|
|
'uluo'=>'02100',
|
|
'uluu'=>'02100',
|
|
'amua'=>'02100',
|
|
'amue'=>'02100',
|
|
'amui'=>'02100',
|
|
'amuo'=>'02100',
|
|
'amuu'=>'02100',
|
|
'emua'=>'02100',
|
|
'emue'=>'02100',
|
|
'emui'=>'02100',
|
|
'emuo'=>'02100',
|
|
'emuu'=>'02100',
|
|
'imua'=>'02100',
|
|
'imue'=>'02100',
|
|
'imui'=>'02100',
|
|
'imuo'=>'02100',
|
|
'imuu'=>'02100',
|
|
'omua'=>'02100',
|
|
'omue'=>'02100',
|
|
'omui'=>'02100',
|
|
'omuo'=>'02100',
|
|
'omuu'=>'02100',
|
|
'umua'=>'02100',
|
|
'umue'=>'02100',
|
|
'umui'=>'02100',
|
|
'umuo'=>'02100',
|
|
'umuu'=>'02100',
|
|
'anua'=>'02100',
|
|
'anue'=>'02100',
|
|
'anui'=>'02100',
|
|
'anuo'=>'02100',
|
|
'anuu'=>'02100',
|
|
'enua'=>'02100',
|
|
'enue'=>'02100',
|
|
'enui'=>'02100',
|
|
'enuo'=>'02100',
|
|
'enuu'=>'02100',
|
|
'inua'=>'02100',
|
|
'inue'=>'02100',
|
|
'inui'=>'02100',
|
|
'inuo'=>'02100',
|
|
'inuu'=>'02100',
|
|
'onua'=>'02100',
|
|
'onue'=>'02100',
|
|
'onui'=>'02100',
|
|
'onuo'=>'02100',
|
|
'onuu'=>'02100',
|
|
'unua'=>'02100',
|
|
'unue'=>'02100',
|
|
'unui'=>'02100',
|
|
'unuo'=>'02100',
|
|
'unuu'=>'02100',
|
|
'arua'=>'02100',
|
|
'arue'=>'02100',
|
|
'arui'=>'02100',
|
|
'aruo'=>'02100',
|
|
'aruu'=>'02100',
|
|
'erua'=>'02100',
|
|
'erue'=>'02100',
|
|
'erui'=>'02100',
|
|
'eruo'=>'02100',
|
|
'eruu'=>'02100',
|
|
'irua'=>'02100',
|
|
'irue'=>'02100',
|
|
'irui'=>'02100',
|
|
'iruo'=>'02100',
|
|
'iruu'=>'02100',
|
|
'orua'=>'02100',
|
|
'orue'=>'02100',
|
|
'orui'=>'02100',
|
|
'oruo'=>'02100',
|
|
'oruu'=>'02100',
|
|
'urua'=>'02100',
|
|
'urue'=>'02100',
|
|
'urui'=>'02100',
|
|
'uruo'=>'02100',
|
|
'uruu'=>'02100'
|
|
)
|
|
);
|
|
|
|
?>
|