• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1%
2%                  ********** lahyph.tex *************
3%
4% Copyright 1999- 2001 Claudio Beccari
5%                [latin hyphenation patterns]
6%
7% -----------------------------------------------------------------
8% IMPORTANT NOTICE:
9%
10% This program can be redistributed and/or modified under the terms
11% of the LaTeX Project Public License Distributed from CTAN
12% archives in directory macros/latex/base/lppl.txt; either
13% version 1 of the License, or any later version.
14% -----------------------------------------------------------------
15%
16% Patterns for the latin language mainly in modern spelling
17% (u when u is needed and v when v is needed); medieval spelling
18% with the ligatures \ae and \oe  and the (uncial) lowercase `v'
19% written as a `u' is also supported; apparently there is no conflict
20% between the patterns of modern  Latin and those of medieval Latin.
21%
22% Support for font encoding OT1 with 128-character set and
23% for font encoding T1 with a 256-character set.
24%
25% Prepared by  Claudio Beccari
26%              Politecnico di Torino
27%              Torino, Italy
28%              e-mail beccari@polito.it
29%
30% 1999/03/10 Integration of `lahyph7.tex' and `lahyph8.tex' into
31% one file `lahyph.tex' supporting fonts in OT1 and T1 encoding by
32% Bernd Raichle using the macro code from `dehypht.tex' (this code
33% is Copyright 1993,1994,1998,1999 Bernd Raichle/DANTE e.V.).
34%
35%
36% \versionnumber{3.1}   \versiondate{2007/04/16}
37%
38% Information after \endinput.
39%
40%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
41%
42\message{Latin Hyphenation Patterns `lahyph' Version 3.1 <2007/04/16>}
43%
44%
45% Next we define some commands which are used inside the patterns.
46% To keep them local, we enclose the rest of the file in a group
47% (The \patterns command globally changes the hyphenation trie!).
48% These initial commands are by Bernd Raichle (see above)
49%
50\begingroup
51%
52% Make sure that doublequote is not active:
53\catcode`\"=12
54%
55%
56% Ligatures \ae and \oe in font encoding OT1
57%
58\catcode"1A=11 \lccode"1A="1A % \ae (^^Z)
59\catcode"1D=11 \lccode"1D="1D % \AE (^^]) (not used)
60\catcode"1B=11 \lccode"1B="1B % \oe (^^[)
61\catcode"1E=11 \lccode"1E="1E % \OE (^^^) (not used)
62%
63% Define \ae and \oe as shorthands for medieval latin
64% ligatures in font encoding OT1:
65\def\ae{^^Z}
66\def\oe{^^[}
67%
68%
69% Then we have to define some macros depending on the TeX version.
70% Therefore we have to distinguish TeX version 2.x and 3.x:
71%
72\ifnum`\@=`\^^40 % true => TeX 3.x
73  %
74  % For TeX 3:
75  % ----------
76  %
77  % Ligatures \ae and \oe in font encoding T1
78  %
79  \catcode"E6=11 \lccode"E6="E6 % \ae
80  \catcode"C6=11 \lccode"C6="E6 % \AE (not used)
81  \catcode"F7=11 \lccode"F7="F7 % \oe
82  \catcode"D7=11 \lccode"D7="F7 % \OE (not used)
83  %
84  % Ligatures \ae and \oe in font encoding T1 are ok:
85  \def\n#1{#1}
86  %
87  % In the following definitions we use ??xy instead of ^^xy
88  % to avoid errors when reading the macro definitions with
89  % TeX 2.x (remember ^^e(6) is the comment character):
90  %
91  \catcode`\?=7
92  %
93  % Define \a and \o to be \ae resp. \oe in font encoding T1:
94  \def\a{??e6} % \ae
95  \def\o{??f7} % \oe
96  %
97  \catcode`\?=12
98  %
99\else
100  %
101  % For TeX 2:
102  % ----------
103  %
104  % Ignore ligatures \ae and \oe in font encoding T1:
105  \def\n#1{}
106  %
107  % Define \a and \o (= \ae, \oe in font encoding T1) to
108  % signal an error:
109  \def\a{\errmessage{Hyphenation pattern file corrupted!}}
110  \def\o{\errmessage{Hyphenation pattern file corrupted!}}
111  %
112\fi
113%
114%
115\lccode`'=`'
116\patterns{%
1172'2
118.a2b3l
119.anti1  .anti3m2n
120.circu2m1
121.co2n1iun
122.di2s3cine
123.e2x1
124.o2b3                                % .o2b3l  .o2b3r .o2b3s
125.para1i  .para1u
126.su2b3lu .su2b3r
1272s3que.  2s3dem.
1283p2sic
1293p2neu
130\ae1 \oe1                            % Ligatures ae and oe (in OT1)
131\n{\a1} \n{\o1}                      % Ligatures ae and oe (in T1)
132a1ia a1ie  a1io  a1iu ae1a ae1o ae1u
133e1iu
134io1i
135o1ia o1ie  o1io  o1iu
136uo3u                                % quousque
1371b   2bb   2bd   b2l   2bm  2bn  b2r  2bt  2bs  2b.
1381c   2cc   c2h2  c2l   2cm  2cn  2cq  c2r  2cs  2ct  2cz  2c.
1391d   2dd   2dg   2dm   d2r  2ds  2dv  2d.
1401f   2ff   f2l   2fn   f2r  2ft  2f.
1411g   2gg   2gd   2gf   g2l  2gm  g2n  g2r  2gs  2gv  2g.
1421h   2hp   2ht   2h.
1431j
1441k   2kk   k2h2
1451l   2lb   2lc   2ld   2lf  l3f2t 2lg 2lk  2ll  2lm  2ln  2lp  2lq  2lr
146     2ls   2lt   2lv   2l.
1471m   2mm   2mb   2mp   2ml  2mn  2mq  2mr  2mv  2m.
1481n   2nb   2nc   2nd   2nf  2ng  2nl  2nm  2nn  2np  2nq  2nr  2ns
149     n2s3m n2s3f 2nt   2nv  2nx  2n.
1501p   p2h   p2l   2pn   2pp  p2r  2ps  2pt  2pz  2php 2pht 2p.
1511qu2
1521r   2rb   2rc   2rd   2rf  2rg  r2h  2rl  2rm  2rn  2rp  2rq  2rr  2rs  2rt
153     2rv   2rz   2r.
1541s2  2s3ph 2s3s  2stb  2stc 2std 2stf 2stg 2st3l     2stm 2stn 2stp 2stq
155     2sts  2stt  2stv  2s.  2st.
1561t   2tb   2tc   2td   2tf  2tg  t2h  t2l  t2r  2tm  2tn  2tp  2tq  2tt
157     2tv   2t.
1581v   v2l   v2r   2vv
1591x   2xt   2xx   2x.
1601z   2z.
161% For medieval Latin
162a1ua a1ue a1ui a1uo a1uu
163e1ua e1ue e1ui e1uo e1uu
164i1ua i1ue i1ui i1uo i1uu
165o1ua o1ue o1ui o1uo o1uu
166u1ua u1ue u1ui u1uo u1uu
167%
168a2l1ua a2l1ue a2l1ui a2l1uo a2l1uu
169e2l1ua e2l1ue e2l1ui e2l1uo e2l1uu
170i2l1ua i2l1ue i2l1ui i2l1uo i2l1uu
171o2l1ua o2l1ue o2l1ui o2l1uo o2l1uu
172u2l1ua u2l1ue u2l1ui u2l1uo u2l1uu
173%
174a2m1ua a2m1ue a2m1ui a2m1uo a2m1uu
175e2m1ua e2m1ue e2m1ui e2m1uo e2m1uu
176i2m1ua i2m1ue i2m1ui i2m1uo i2m1uu
177o2m1ua o2m1ue o2m1ui o2m1uo o2m1uu
178u2m1ua u2m1ue u2m1ui u2m1uo u2m1uu
179%
180a2n1ua a2n1ue a2n1ui a2n1uo a2n1uu
181e2n1ua e2n1ue e2n1ui e2n1uo e2n1uu
182i2n1ua i2n1ue i2n1ui i2n1uo i2n1uu
183o2n1ua o2n1ue o2n1ui o2n1uo o2n1uu
184u2n1ua u2n1ue u2n1ui u2n1uo u2n1uu
185%
186a2r1ua a2r1ue a2r1ui a2r1uo a2r1uu
187e2r1ua e2r1ue e2r1ui e2r1uo e2r1uu
188i2r1ua i2r1ue i2r1ui i2r1uo i2r1uu
189o2r1ua o2r1ue o2r1ui o2r1uo o2r1uu
190u2r1ua u2r1ue u2r1ui u2r1uo u2r1uu
191%
192%
193}
194\endgroup
195%
196\endinput
197%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
198
199 For documentation see:
200 C. Beccari, "Computer aided hyphenation for Italian and Modern
201       Latin", TUG vol. 13, n. 1, pp. 23-33 (1992)
202
203 see also
204
205 C. Beccari, "Typesetting of ancient languages",
206             TUG vol.15, n.1, pp. 9-16 (1994)
207
208 In the former paper  the  code  was  described  as  being contained in file
209 ITALAT.TEX; this is substantially the same code,  but  the  file  has  been
210 renamed  LAHYPH.TEX  in  accordance  with  the  ISO  name for Latin and the
211 convention that all hyphenation pattern file  names should be formed by the
212 agglutination of two letter language ISO code and the abbreviation HYPH.
213
214 A corresponding file (ITHYPH.TEX) has been extracted in order to  eliminate
215 the  (few)  patterns specific to Latin and leave those specific to Italian;
216 ITHYPH.TEX has been further  extended  with  many  new patterns in order to
217 cope with the many neologisms and technical terms with foreign roots.
218
219 Should you find any word that gets hyphenated in a wrong way, please, AFTER
220 CHECKING  ON A RELIABLE MODERN DICTIONARY, report to the author, preferably
221 by e-mail.  Please  do  not  report  about  wrong  break  points concerning
222 prefixes and/or suffixes; see at the bottom of this file.
223
224 Compared with the previous versions, this file has been extended so  as  to
225 cope also with the medieval Latin spelling, where the letter `V' played the
226 roles of both `U' and `V', as in the Roman times, save that the Romans used
227 only capitals. In the middle ages the availability of soft writing supports
228 and the necessity of copying books with a reasonable speed, several scripts
229 evolved  in  (practically)  all  of  which  there was a lower case alphabet
230 different from the upper case  one,  and  where  the lower case `v' had the
231 rounded shape of our modern lower case `u', and where the Latin  diphthongs
232 `AE'  and  `OE',  both in upper and lower case, where written as ligatures,
233 not to mention the habit of  substituting  them with their sound, that is a
234 simple `E'.
235
236 According  to  Leon  Battista  Alberti,  who  in  1466  wrote  a  book   on
237 cryptography  where  he  thoroughly  analyzed  the hyphenation of the Latin
238 language of his (still  medieval)  times,  the  differences from the Tuscan
239 language (the Italian language, as it was named  at  his  time)  were  very
240 limited,  in particular for what concerns the handling of the ascending and
241 descending diphthongs; in  Central  and  Northern  Europe,  and later on in
242 North America, the Scholars perceived the above diphthongs as made  of  two
243 distinct  vowels;  the  hyphenation of medieval Latin, therefore, was quite
244 different in the northern countries compared to the southern ones, at least
245 for what concerns these  diphthongs.  If  you need hyphenation patterns for
246 medieval Latin that suite you better according to the  habits  of  Northern
247 Europe  you  should  resort  to the hyphenation patterns prepared by Yannis
248 Haralambous (TUGboat, vol.13 n.4 (1992)).
249
250
251
252                           PREFIXES AND SUFFIXES
253
254For what concerns prefixes and suffixes, the latter are generally  separated
255according  to  "natural"  syllabification,  while  the  former are generally
256divided etimologically. In order to  avoid  an excessive number of patterns,
257care has been paid to some prefixes,  especially  "ex",  "trans",  "circum",
258"prae",  but  this set of patterns is NOT capable of separating the prefixes
259in all circumstances.
260
261                        BABEL SHORTCUTS AND FACILITIES
262
263Read  the  documentation  coming  with the discription of the Latin language
264interface of  Babel  in  order  to  see  the  shortcuts  and  the facilities
265introduced in order to facilitate the insertion  of  "compound  word  marks"
266which are very useful for inserting etimological break points.
267
268Happy Latin and multilingual typesetting!
269