comparison DESpecs/DESpecs_chinese.tex @ 14:c3c84bdd1fdd

Chinesische Version und XML-Version hinzugef?gt
author Klaus Thoden <kthoden@mpiwg-berlin.mpg.de>
date Thu, 02 May 2013 11:38:23 +0200
parents
children b2bcb3f68258
comparison
equal deleted inserted replaced
13:facea8c79160 14:c3c84bdd1fdd
1 %!TEX TS-program = xelatex
2 %!TEX encoding = UTF-8 Unicode
3
4 \documentclass[fontsize=11pt, paper=a4,
5 DIV15,
6 headings=normal,
7 parskip=half-,
8 numbers=noenddot]{scrartcl}
9
10 \usepackage[british]{babel}
11
12 \usepackage{fontspec,xltxtra,xunicode}
13 \defaultfontfeatures{Mapping=tex-text}
14
15 \setromanfont[Mapping=tex-text]{DejaVu Serif}
16 \setsansfont[Scale=MatchLowercase,Mapping=tex-text]{Helvetica}
17 \setmonofont[Scale=1.0]{Courier New}
18
19 \frenchspacing
20
21 \usepackage{graphicx}
22 \graphicspath{{../../bilder/chinese/}}
23
24 \usepackage{longtable}
25
26 %%%
27
28 \input{../../abbreviations/abbreviations_2}
29
30 \newcommand{\hash}{{\char"0023}}
31 \newenvironment{typeChinese}{\begin{alltt}\s\begin{tabular}{@{}l}}{\end{tabular}\end{alltt}}
32
33 \newcommand{\chin}[1]{{\fontspec{Sun-ExtA}{#1}}}
34 \newcommand{\sunExtA}[1]{{\fontspec{Sun-ExtA}{#1}}}
35 \newcommand{\sunExtB}[1]{{\fontspec{Sun-ExtB}{#1}}}
36 \newcommand{\extB}[1]{{\fontspec{Sun-ExtB}{#1}}}
37
38 \newcommand{\mincho}[1]{{\fontspec{MS Mincho}{#1}}}
39 \newcommand{\hira}[1]{{\fontspec{HiraMinPro-W3}{#1}}}
40
41 % Verkürzung von \bold und \chin:
42 % schon vorhanden: ch, c, s; b, bf
43 % noch nicht vorhanden: sun (bringt aber nicht viel)
44 \newcommand{\f}[1]{\bold{#1}} % f für fett
45 \newcommand{\z}[1]{\chin{#1}} % z für Zeichen
46
47 %%%
48
49 \begin{document}
50
51 \begin{center}
52 {\fontspec{Helvetica}{\LARGE \textbf{
53 Data Entry Specs for Chinese Text }}} \\[5mm]
54 \large Wolfgang Schmidle, Martina Siebert, \\[1mm]
55 Martin Hofmann, Klaus Thoden, Malcolm D. Hyman
56
57 \normalsize Max Planck Institute for the History of Science, Berlin, Germany
58
59 Version 2.1 \\[1mm]
60 \today
61 \end{center}
62
63 \tableofcontents
64
65 \newpage
66
67 \section{File Conventions}
68 \label{section file conventions}
69
70 \begin{mainrule}
71 Save the text in plain text format (§.txt§) with Unicode §utf-8§ encoding. If the text is saved in more than one file, number the parts, for example §Euclid_part_001.txt§, §Euclid_part_002.txt§, and so on. Create a §zip§ archive of all files.
72 \end{mainrule}
73
74 \begin{mainrule}
75 Make use of the complete character repertoire found in Unicode version 5.1.
76 \end{mainrule}
77
78 \begin{clarification}
79 This includes characters in the following Unicode blocks when applicable:
80
81 \begin{itemize}
82 \item CJK Unified Ideographs Extension A (U+3400 -- U+4DFF)
83 \item CJK Unified Ideographs Extension B (U+20000 -- U+2A6DF)
84 %\item CJK Compatibility Ideographs Supplement (U+2F800 -- U+2FA1F)
85 \end{itemize}
86 At this point, do not make use of the characters in Extension C or D.
87 \end{clarification}
88
89 \begin{mainrule}
90 We will also need the list of unknown characters (see \sect{section unknown characters}) and the list of character variants (see \sect{section character variants}). Please send each list in two versions, namely in the original file format (e.g. RTF, DOC, XLS) and as PDF. If the lists are handwritten, scan them and save them as PDF files.
91 \end{mainrule}
92
93
94 \section{General Markup}
95
96 \begin{mainrule}
97 Type the entire contents of one page, then go on to the next page. Do not mix the contents of different pages.
98 \end{mainrule}
99
100 \tocspace
101 \subsection{Page Breaks, Page Numbers and Running Heads}
102
103 \label{section page breaks}
104
105 \begin{mainrule}
106 Page breaks are marked by §<pb>§. If the page has a page number, type it within the §<pb>§ tag, e.g. §<pb §\z{六}§>§. Type the page number exactly as it appears in the book. If there is a running head on the page, it is marked by §<rh>§ and §</rh>§. Type the running head immediately after the §<pb>§ tag.
107 \end{mainrule}
108
109 \begin{clarification}
110 Type the §<pb>§ and §<rh>§ tags before you type any page content.
111 \end{clarification}
112
113 \begin{mainrule}
114 The centre section of a traditional printing page (\emph{banxin} \z{版心}) is equivalent to a running head in a western book layout. In this case, repeat §<pb>§ and the running head for each half-page, but add §a§ and §b§ to the page number, e.g. §<pb §\z{三}§a>§ and §<pb §\z{三}§b>§, or §<pb a>§ and §<pb b>§ if there is no page number.
115 \end{mainrule}
116
117 \begin{clarification}
118 If the characters of the running head are cut off on the scanned page, type them anyway. Type large spaces in the running head as a single IDEOGRAPHIC SPACE character U+3000.
119 \end{clarification}
120
121 \begin{note}
122 In the digitization of the book, the two half-pages may be on the same scan or on two consecutive scans.
123 \end{note}
124
125 \begin{tabular}{@{}ll}
126 \parbox[b]{116mm}{
127 \htsc{Examples} \\[18mm]
128 \begin{typeChinese}
129 \f{<pb} \z{三十二}\f{a><rh>}\z{泰西事物}\f{<}\z{起}\f{V>}\z{原 第十一章}\f{</rh>} \\
130 \\
131 \f{<pb} \z{十二}\f{a><rh>}\z{事物攷辨卷之六十三 }\f{<sm>}\z{植物}\f{</sm>}\z{ 帶經堂}\f{</rh>} \\
132 \\
133 \f{<pb} \z{一}\f{a><rh>}\z{閩產}\f{<}\z{錄}\f{V>}\z{異 卷一}\f{<sm>}\z{穀屬}\f{</sm></rh>} \\
134 \\
135 \f{<pb} \z{一}\f{b><rh>}\z{閩產錄異 卷一}\f{<sm>}\z{穀屬}\f{</sm></rh>} \\[18mm]
136 \end{typeChinese}}
137 &
138 \includegraphics[height=8cm]{chinese_rh_1} \qquad
139 \includegraphics[height=8cm]{chinese_rh_2} \qquad
140 \includegraphics[height=8cm]{chinese_rh_3a} \qquad
141 \includegraphics[height=8cm]{chinese_rh_3b}
142 \end{tabular}
143
144 \vspace{3mm}
145 \begin{crossref}
146 For §<sm>§ see \sect{section chinese small characters}. An example of two complete half-pages with their running heads can be seen in \sect{section chinese paragraphs}.
147 \end{crossref}
148
149 \begin{note}
150 For §< V>§ (i.e. marking character variants which are not included in Unicode 5.1) see \sect{section character variants}.
151 \end{note}
152
153
154 \tocspace
155 \subsection{Text Blocks}
156
157 \begin{mainrule}
158 Type a return after each line of the printed page.
159 \end{mainrule}
160
161 \begin{clarification}
162 Do not insert a space at the end of the line.
163 \end{clarification}
164
165
166
167 \subsubsection{Headings}
168 \label{section chinese headings}
169
170 \begin{mainrule}
171 Headings are marked by §<h> </h>§. If you can identify a heading as the book title, use §<ti>§ for the whole line. If you can identify a heading as the name of the author, compilator, proofreader etc. (\emph{ti} \z{題}), use §<ti>§ too. If a text has different levels of headings, use §<h 1>§ for all headings on the highest level, §<h 2>§ for all headings on the second highest level, and so on.
172 \end{mainrule}
173
174 \begin{clarification}
175 If a heading, book title, author, etc. is indented, do not mark this. Type large spaces in the heading as a single IDEOGRAPHIC SPACE character U+3000.
176 \end{clarification}
177
178 %\begin{note}
179 %Typically, a book has at most three different heading levels, i.e. §<h 1>§, §<h 2>§ and §<h 3>§.
180 %\end{note}
181
182
183 %\begin{example} % Text 17-1, p.11; Text 14, p.74
184
185 \begin{tabular}{@{}ll}
186 \parbox[b]{131mm}{
187 \htsc{Example} \\[3mm]
188 \begin{typeChinese}
189 \f{<ti>}\z{閩產}\f{<}\z{錄}\f{V>}\z{異卷一}\f{</ti>} \\
190 \f{<stamp>} \\
191 \f{<ti>}\z{侯官郭柏}\f{<}\z{蒼}\f{R><}\z{蒹}\f{R>}\z{秋輯}\f{</ti>} \\
192 \f{<h 1>}\z{穀屬}\f{</h>} \\
193 \f{<h 2>}\z{早占城晚占城}\f{</h>}\z{ }\f{<p>}\z{有赤白二種宋真宗以福建田多高} \\
194 \z{仰聞占城稻耐旱遣使求其種得二十石以遺閩農} \\
195 \z{今延建邵福甯龍巖種者尚少餘則徧種矣各郡}\f{<}\z{縣}\f{V>} \\
196 ... \f{</p>} \\
197 \f{<h 2>} ... \f{</h>}\z{ }\f{<p>} ... \\
198 ... \f{</p>} \\[20mm]
199 \end{typeChinese}
200 } &
201 \includegraphics[height=8cm]{text17-1p11}
202 \end{tabular}
203
204 \vspace{-8mm}
205 \begin{crossref}
206 For §<stamp>§ see \sect{section chinese stamps}. For §<p>§ see \sect{section chinese paragraphs}.
207 \end{crossref}
208
209 \vspace{5mm}
210 \begin{note}
211 In the transcription of this example, there are three headings on two different levels (§<h 1>§, §<h 2>§, §<h 2>§). In the example in \sect{section chinese paragraphs} there are two headings, both on level 2 (§<h 2>§, §<h 2>§). §<h 1>§ appears on other pages of the book.
212 \end{note}
213
214 %\begin{note}
215 %In this example, the base line for indentation (see \sect{section chinese paragraphs}) would be one character below the printing frame.
216 %\end{note}
217
218 %(We do not make them mark “Sperrung” in book titles.)
219
220
221 \subsubsection{Paragraphs}
222 \label{section chinese paragraphs}
223
224 \begin{mainrule}
225 Paragraphs are marked by §<p>§ and §</p>§. Indented paragraphs are marked by one or more §i§, e.g. §<p iii>§ for a paragraph that is indented by three character spaces. Outdented paragraphs are marked by one or more §x§, e.g. §<p x>§.
226 \end{mainrule}
227
228 \begin{clarification}
229 Every part of the book has a base line where all unindented paragraphs start. The base lines in the preface or table of contents may be different from the base line in the main text. Mark indentations relative to the base line. The indentation symbols §i§ and §x§ always refer to the first line of the paragraph. The remaining lines of the paragraph may have the same or a different indentation, which is not marked. If a paragraph is preceded by a sub-heading in the same line, as in the example in \sect{section chinese headings}, do not mark the indentation at all.
230 \end{clarification}
231
232 \begin{clarification}
233 Make sure that for each §<p>§ there is a corresponding §</p>§ somewhere. If a paragraph starts and ends on different pages, the §<p>§ and §</p>§ tags are on these different pages.
234 \end{clarification}
235
236 \begin{tabular}{@{}ll}
237 \parbox[b]{29.5mm}{
238 \htsc{Example} \\[80mm]
239 } &
240 \includegraphics[height=9cm]{text14p74_neu} \quad
241 \includegraphics[height=9cm]{text14p73}
242 \end{tabular}
243
244 \begin{typeChinese}
245 \f{<pb} \z{三十}\f{a><rh>}\z{泰西事物}\f{<}\z{起}\f{V>}\z{原 }\f{<sm>}\z{第十一章}\f{</sm></rh>} \\
246 \z{之水。蒸滊機關之供於實用。以此爲嚆矢。其後十八世}\f{<}\z{紀}\f{R>}\z{之初。}\f{<dl>}\z{古剌斯哥}\f{</dl>}\z{大學教} \\
247 \z{授}\f{<sl>}\z{鳥可曼}\f{</sl>}\z{復改良蒸汽機。然}\f{<sl>}\z{沙威利}\f{</sl>}\z{及鳥可曼之機械。乃以火氣之壓力。推水上} \\
248 \z{之方法。其蒸氣只不}\f{<}\z{過}\f{RV>}\z{使交互造成眞空耳。故與其謂之蒸氣機。寧謂之空氣機} \\
249 \z{也。}\f{</p>} \\
250 \f{<p>}\z{眞蒸氣機。至一千七百六十四年。英人}\f{<sl><}\z{滑}\f{V></sl>}\z{始發明之。是完全之蒸氣機也。} \\
251 \f{<sl>}\z{滑}\f{</sl>}\z{之蒸氣機。乃低度機也。其後英人}\f{<sl>}\z{他撇}\f{</sl>}\z{復創作高底機。}\f{<sl>}\z{披京}\f{</sl>}\z{改良之。}\f{</p>} \\
252 \f{<h 2>}\z{滊船}\f{</h>} \\
253 \f{<p>}\z{據前頃所揭。始造滊船者。乃西班牙之海軍士官}\f{<sl>}\z{家勒}\f{</sl>}\z{也。然此事似難}\f{<}\z{置}\f{V>}\z{信。且其} \\
254 \z{滊船非供實際之用者。故姑置之不論。滊船之發明者。實乃}\f{<sl>}\z{夫耳頓}\f{</sl>}\z{也。夫耳頓者。} \\
255 \z{合衆國人。自一千七百九十七年時。謀策創作滊船之事。至一千八百七年八月} \\
256 \z{四日。始以其製成滊船『古力亞門』號。放於}\f{<dl>}\z{哈德孫}\f{</dl>}\z{河上。往復於}\f{<dl>}\z{紐育}\f{</dl>}\z{及}\f{<dl>}\z{亞耳巴} \\
257 \z{尼}\f{</dl>}\z{之間。是爲滊船航海之嚆矢。}\f{</p>} \\
258 \\
259 \f{<pb} \z{三十}\f{b><rh>}\z{泰西事物起原 }\f{<sm>}\z{第十一章}\f{</sm></rh>} \\
260 \f{<p i>}\z{英人}\f{<sl>}\z{司民}\f{</sl>}\z{頓。曾於一千七百八十九年。創作滊船。長六十英尺。往復於}\f{<dl>}\z{科斯}\f{</dl>}\z{及} \\
261 \f{<dl>}\z{古禮}\f{</dl>}\z{德運河之間。是第三回試驗也。據此觀之。則}\f{<sl>}\z{司民頓}\f{</sl>}\z{之發明本先於}\f{<sl>}\z{夫} \\
262 \z{耳}\f{</sl>}\z{頓。但不幸未見十分成功。而司民頓死亡。今載澀江保所譯之『萬國發} \\
263 \z{明家列傳』之一節以供參考。}\f{</p>} \\
264 \f{<p iii>}\z{據英國發兌之諸書。}\f{<sl>}\z{司民}\f{</sl>}\z{頓。當由}\f{<dl>}\z{科斯}\f{</dl>}\z{河試航於}\f{<sl>}\z{古蘭毋斯}\f{</sl>}\z{之際。一日有} \\
265 \z{敏捷}\f{<}\z{伶}\f{V>}\z{俐之外人。來求面會}\f{<sl>}\z{司}\f{</sl>}\z{氏。}\f{<sl>}\z{司民頓}\f{</sl>}\z{爲人温厚不設城壁。應來客之} \\
266 \z{扣。而說明其機關之詳細。不圖此外人卽夫}\f{<sl>}\z{耳頓}\f{</sl>}\z{也。夫耳頓得盡叩其端} \\
267 \z{委。乃藉之以爲自己發明之端}\f{<}\z{緖}\f{R>}\z{云。此事未知果否。}\f{</p>} \\
268 \f{<h 2>}\z{船}\f{</h>} \\
269 \f{<p>}\z{創世紀云『諾亞當洪水時以松木爲方舟』。其方舟長三百喬別}\f{<sm>}\z{每喬別}\f{<}\z{約}\f{V>}\z{長}\f{\bs\bs}\z{十八英寸}\f{<sm>}\z{ }\f{<}\z{廣}\f{V>} \\
270 \z{五十喬別。高三十喬別。中造房。以瀝靑塗其內外。及有導光牖。又方舟分爲三層。} \\
271 \z{曰下牀二樓。三樓。此乃船之最古者也。但獨木船則彼石器時代之人。亦}\sunExtA{既}\z{能造} \\
272 \end{typeChinese}
273
274 %\vspace{-2mm}
275 \begin{crossref}
276 For §<sm>§ see \sect{section chinese small characters}. For §<sl>§ and §<dl>§ see \sect{section chinese underlinings}.
277 \end{crossref}
278
279 \vspace{3mm}
280 \begin{note}
281 For the marking of character variants (§< V>§, §< R>§, §< RV>§) see \sect{section character variants}. Only the first appearance of each character variant is marked. For instance, \z{起} is marked in the first running head but not in the second one.
282 % The two half-pages are treated as if they were the beginning of the text. Consequently, \z{起} is marked even though it already appears on earlier pages.
283 (In addition, every example in the Data Entry Specs is treated as if it was the beginning of a text, i.e. \z{起} is marked on the first half-page even though it already appears on earlier pages of the text.)
284 \end{note}
285
286
287 \tocspace
288 \subsection{Structured Text}
289 \label{section structured text}
290
291 \subsubsection{Tables}
292 \label{section tables}
293
294 \begin{mainrule}
295 A table is marked by §<tb>§ and §</tb>§. Use §#§ as field separators. Type a return after each row. Do not type horizontal or vertical lines.
296 \end{mainrule}
297
298 \begin{clarification}
299 Type the §<tb>§ and §</tb>§ tags on separate lines. Do not mark indentations. The field separators may be lines or large spaces.
300 \end{clarification}
301
302 \begin{clarification}
303 If you can identify a single space within a name etc. as a decorative space to make the table layout optically more pleasing, do not type it.
304 \end{clarification}
305
306 \vspace{3mm}
307 \begin{tabular}{@{}ll}
308 \parbox[b]{88mm}{
309 \htsc{Example} \\
310 \begin{typeChinese}
311 \f{<p>}\z{今日諸國所用文字之數如左}\f{</p>} \\
312 \f{<tb>} \\
313 \z{英吉利} \f{\hash} \z{二十六} \\
314 \z{法蘭西} \f{\hash} \z{二十三} \\
315 \z{西班牙} \f{\hash} \z{二十七} \\
316 \z{希臘} \f{\hash} \z{二十四} \\
317 \z{斯格拉}\f{<}\z{窩}\f{V>}\z{尼亞} \f{\hash} \z{二十七} \\
318 \z{德意志} \f{\hash} \z{二十六} \\
319 \z{意大利} \f{\hash} \z{二十} \\
320 \z{俄}\f{<}\z{羅}\f{V>}\z{斯} \f{\hash} \z{四十一} \\
321 \z{拉丁} \f{\hash} \z{二十三} \\
322 \z{希伯流} \f{\hash} \z{二十二} \\
323 \z{梵字} \f{\hash} \z{五十} \\
324 \f{</tb>}
325 \end{typeChinese}
326 } &
327 \includegraphics[height=6cm]{text14p43}
328 \end{tabular}
329
330
331 \subsubsection{Lists}
332 \label{section chinese lists}
333
334 %\mehrzeilen[5]
335
336 \begin{mainrule}
337 A list is marked by §<list>§ and §</list>§. Use §#§ for large spaces, if there are any.
338 \end{mainrule}
339
340 \begin{clarification}
341 Type the §<list>§ and §</list>§ tags on separate lines. If the items on consecutive text lines belong to the same list entry, use §#§ at the beginning of the next line. Do not mark indentations.
342 \end{clarification}
343
344 \begin{clarification}
345 Unlike in tables, type each single space, i.e. do not omit single spaces even if they seem to be merely decorative.
346 \end{clarification}
347
348 \begin{tabular}{@{}ll}
349 \parbox[b]{112mm}{
350 \htsc{Example} \\
351 \begin{typeChinese}
352 \f{<list>} \\
353 \z{(第一) 意大利語} \f{\hash} \z{西班牙語} \f{\hash} \z{法蘭西語 等} \\
354 \f{\hash} \z{同由拉丁語出} \\
355 \z{(第二) 俄}\f{<}\z{羅}\f{V>}\z{斯語} \f{\hash} \z{波蘭語} \f{\hash} \z{波希密亞語 等} \\
356 \f{\hash} \z{同由斯拉夫語出} \\
357 \z{(第三) 威爾斯語} \f{\hash} \z{希臘語} \f{\hash} \z{不列顚語 等} \\
358 \f{\hash} \z{同由塞爾語出} \\
359 \f{</list>} \\
360 \f{<p>}\z{以上屬於亞利安語系}\f{</p>} \\
361 \f{<list>} \\
362 \z{(第四) 亞刺比亞語} \f{\hash} \z{希伯流語} \f{\hash} \z{叙利亞語 等} \\
363 \f{\hash} \z{同由塞美的語出} \\
364 \f{</list>} \\[10mm]
365 \end{typeChinese}
366 } &
367 \includegraphics[height=8cm]{text14p32_2}
368 \end{tabular}
369
370 \begin{crossref}
371 For an example of a list-like structure without large spaces see \sect{section chinese tocs} (second example).
372 \end{crossref}
373
374
375 \subsubsection{Tables of Contents}
376 \label{section chinese tocs}
377
378 \mehrzeilen[5]
379
380 \begin{mainrule}
381 A table of contents is marked by §<toc>§ and §</toc>§. If the table of contents has a table-like structure or a list-like structure with large spaces, use §#§.
382 \end{mainrule}
383
384 \begin{clarification}
385 Type the §<toc>§ and §</toc>§ tags on separate lines. A table of contents may look like a table or like a list.
386 \end{clarification}
387
388 \vspace{3mm}
389 \begin{tabular}{@{}ll}
390 \parbox[b]{72mm}{
391 \htsc{Examples \\[2mm] \s{a table-like table of contents \\[2mm] a list-like table of contents \\ without large spaces}} \\[5mm]
392 \begin{typeChinese}
393 \f{<toc>} \\
394 \f{<h>}\z{第一章 天時}\f{</h>} \\
395 \z{日月} \f{\hash} \z{日月}\f{<}\z{蝕}\f{R>} \f{\hash} \z{地球} \f{\hash} \z{地球之圓體} \\
396 \z{地動說} \f{\hash} \z{遊星} \f{\hash} \z{七曜日} \f{\hash} \z{晝夜} \\
397 \z{時間} \f{\hash} \z{年月} \f{\hash} \z{歲首} \f{\hash} \f{<}\z{紀}\f{R>}\z{元} \\
398 \z{三時代} \f{\hash} \z{天氣豫報} \\
399 \f{<h>}\z{第二章 地理}\f{</h>} \\
400 \z{亞美利加} \f{\hash} \z{墺斯土剌利亞} \f{\hash} \z{蘇彛士河} \f{\hash} \z{山} \\
401 \z{堤埭} \f{\hash} \z{橋} \f{\hash} \z{周航地球} \f{\hash} \z{大洪水} \\
402 ... \\
403 \f{</toc>} \\[28mm]
404 \end{typeChinese}
405 } & \qquad
406 \parbox[b]{5cm}{
407 \includegraphics[height=8.5cm]{text14p5} \\[20mm] } \qquad
408 \includegraphics[height=11cm]{text17-1p7}
409 \end{tabular}
410
411 \vspace{-33mm}
412 \begin{typeChinese}
413 \f{<toc>} \\
414 ... \\
415 \z{安南稻 米麥 牛尾粟}\f{<sm>}\z{雀粟 鵞掌粟 狗尾}\f{\bs\bs}\z{粟 虎尾粟 }\f{<}\z{黄}\f{V>}\z{粟}\f{</sm>} \\
416 \z{黄粢 釣鈎黍}\f{<sm>}\z{馬尾黍 番黍 鴨脚黍}\f{\bs\bs}\z{ 黑黍 長}\f{<}\z{芒}\f{R>}\z{黍 膏黍}\f{</sm>}\z{ 豆}\f{<sm>}\z{白豆}\f{\bs\bs}\z{ 黄} \\
417 \z{豆 黑豆 綠豆 豇豆 豌豆 赤小豆 青豆}\f{\bs\bs}\z{ 褐豆 刀豆 虎爪豆 蠏眼豆 皂}\f{<}\z{莢}\f{R>}\z{豆 羊} \\
418 ... \f{</sm>} \\
419 \f{</toc>} \\
420 \end{typeChinese}
421
422
423 \tocspace
424 \subsection{Printed Images}
425
426
427 \subsubsection{Figures}
428 \label{section chinese figures}
429
430 \begin{mainrule}
431 Where a figure occurs in the text, type §<fig>§ on a separate line. If you can identify a caption of the figure, mark it by §<cap> </cap>§. Additional text that describes parts of the figure is marked by §<desc> </desc>§. Use a single §<var> </var>§ tag for variable names and numbers. Finally, type a closing §</fig>§ tag on a separate line.
432 %Figures are marked by §<fig>§ and §</fig>§ on separate lines. If you can identify a caption of the figure, mark it by §<cap> </cap>§. Additional text that describes parts of the figure is marked by §<desc> </desc>§.
433 \end{mainrule}
434
435 \begin{clarification}
436 Type all §<cap>§, §<desc>§ and §<var>§ tags, in this order, on separate lines. A figure may have more than one description. If the same description is repeated in a figure, type it only once. Separate the variable names and numbers in the §<var> </var>§ by spaces. Type §<fig/>§ instead of §<fig>§ and §</fig>§ to mark simple figures without §<cap>§, §<desc>§ or §<var>§ tags.
437 %Type the caption on a separate line after §<fig>§. A figure may have more than one description. Type each description on a separate line after §<fig>§ and §<cap>§. If the same description is repeated in a figure, type it only once.
438 \end{clarification}
439
440 \begin{tabular}{@{}ll}
441 \parbox[b]{8.3cm}{
442 \htsc{Examples} \\
443 \begin{typeChinese}
444 \f{<fig>} \\
445 \f{<cap>}\z{第九鐵餅正看圖}\f{<sm>}\z{四分之一}\f{</sm>}\f{</cap>} \\
446 \f{<desc>}\z{秋}\f{</desc>} \\
447 \f{<desc>}\z{收}\f{</desc>} \\
448 \f{</fig>} \\
449 \f{<fig>} \\
450 \f{<cap>}\z{鐵餅剖看圖}\f{</cap>} \\
451 \f{<desc>}\z{秋}\f{</desc>} \\
452 \f{<desc>}\z{螺帽}\f{</desc>} \\
453 \f{<desc>}\z{收}\f{</desc>} \\
454 \f{<desc>}\z{螺鍵}\f{</desc>} \\
455 \f{</fig>} \\
456 \end{typeChinese}} &
457 \includegraphics[width=8.1cm]{text18-1p24}
458 \end{tabular}
459
460 \vspace{5mm}
461 \begin{tabular}{@{}lll}
462 \parbox[b]{121mm}{
463 \begin{typeChinese}
464 \f{<fig>} \\
465 \f{<var>}\z{九} \z{甲} \z{六} \z{乙} \z{十二} \z{丙} \z{八} \z{丁}\f{</var>} \\
466 \f{</fig>} \\
467 \end{typeChinese}} &
468 \includegraphics[height=4cm]{Euklid1996_p266}
469 \end{tabular}
470
471 \begin{tabular}{@{}lll}
472 \parbox[b]{126.5mm}{
473 \begin{typeChinese}
474 \\
475 \f{<pb a><rh>}\z{泰西事物}\f{<}\z{起}\f{V>}\z{原 }\f{<sm>}\z{第三章}\f{</sm></rh>} \\
476 ... \\
477 \f{<fig>} \\
478 \f{<desc>}\z{第二大派}\f{</desc>} \\
479 \f{<desc>}\z{希伯流語}\f{</desc>} \\
480 \f{<desc>}\z{亞刺比亞語}\f{</desc>} \\
481 \\
482 \f{<pb b><rh>}\z{泰西事物起原 }\f{<sm>}\z{第三章}\f{</sm></rh>} \\
483 \f{<desc>}\z{非尼西亞語}\f{</desc>} \\
484 \f{</fig>} \\
485 ... \\
486 \end{typeChinese}} &
487 \includegraphics[height=5cm]{figure_14_33teil2} &
488 \includegraphics[height=5cm]{figure_14_33teil1}
489 \end{tabular}
490
491 \begin{tabular}{@{}lll}
492 \parbox[b]{8.3cm}{
493 \begin{typeChinese}
494 \f{<p>}\z{西洋大彈式十種 凡彈必合銃口徑以爲圓形故不預} \\
495 \z{定大小斤數}\f{</p>} \\
496 \f{<fig>} \\
497 \f{<desc>}\z{圓彈}\f{</desc>} \\
498 \f{</fig>} \\
499 \f{<fig>} \\
500 \f{<desc>}\z{中空}\f{<}\z{迎}\f{R>}\z{風} \\
501 \z{其聲如雷}\f{</desc>} \\
502 \f{<desc>}\z{響彈}\f{</desc>} \\
503 \f{</fig>} \\
504 \f{<fig>} \\
505 \f{<desc>}\z{中用百鍊鋼條兩頭銼} \\
506 \z{尖鑄時先定中}\f{<}\z{線}\f{R>}\z{毋使} \\
507 \z{稍偏長短致} \\
508 \z{有輕重低昂} \\
509 \z{不能直貫}\f{</desc>} \\
510 \f{<desc>}\z{遇賊攻} \\
511 \z{寨勢如} \\
512 \z{拉朽}\f{</desc>} \\
513 \f{</fig>} \\
514 \f{<fig>} \\
515 \f{<desc>}\z{彈形兩分中}\f{<}\z{綰}\f{R>}\z{百鍊} \\
516 \z{鋼條不拘長短點放} \\
517 \f{<}\z{迸}\f{R>}\z{發橫拉如火龍}\f{</desc>} \\
518 \f{<desc>}\z{鍊彈}\f{</desc>} \\
519 \f{</fig>} \\
520 \f{<fig>} \\
521 \f{<desc>}\z{最厚之城用十}\f{<}\z{餘}\f{R>}\z{彈先} \\
522 \z{鑿破磚石}\f{<}\z{繼}\f{R>}\z{以員彈推} \\
523 \z{倒}\f{</desc>} \\
524 \f{<desc>}\z{攻城}\f{</desc>} \\
525 \f{</fig>} \\
526 \f{<fig>} \\
527 \f{<desc>}\z{攻城攻墻一也特中用} \\
528 \z{鋼鑿大小厚薄不同耳} \\
529 \z{鑄法如前說}\f{</desc>} \\
530 \f{<desc>}\z{攻墻}\f{</desc>} \\
531 \f{</fig>} \\
532 \end{typeChinese}
533 } &
534 \parbox[b]{8cm}{
535 \includegraphics[height=12cm]{text16p69}
536 \vspace{14mm}
537 \\
538 }
539 \end{tabular}
540
541
542 \subsubsection{Stamps}
543 \label{section chinese stamps}
544
545 \begin{mainrule}
546 Stamps are marked by §<stamp>§. Type the §<stamp>§ tag on a separate line. Do not type the text in the stamp.
547 \end{mainrule}
548
549 \begin{crossref}
550 For an example see \sect{section chinese headings}.
551 \end{crossref}
552
553
554 \tocspace
555 \subsection{Unreadable Text}
556 \label{section unreadable text}
557
558
559 \subsubsection{Characters You are Unsure About}
560 \label{section characters you are unsure about}
561
562 \begin{mainrule}
563 If you are not sure about a character, type §<?>§ after it. If you are unsure about a whole paragraph, type §<?>§ directly after the §<p>§ tag, i.e. §<p><?>§. A completely unreadable character is typed as §@§. If many characters are unreadable, use §<gap>§ instead of §@§.
564 \end{mainrule}
565
566 \begin{clarification}
567 Use one §@§ for each unreadable character, e.g. §unr@@dable§. If in doubt, use §<gap>§, e.g. §unr<gap>dable§. If you are unsure about a group of characters, for example a whole word, do not type §<?>§ repeatedly for every character, e.g. type §word<?>§ rather than §w<?>o<?>r<?>d<?>§.
568 \end{clarification}
569
570 \begin{tabular}{@{}ll}
571 \parbox[b]{129.5mm}{
572 \htsc{Examples} \\[8mm]
573 \begin{typeChinese}
574 \z{上戊其日祀事禮成}\f{<?>@} \\
575 \z{陳尚明率元儒姬紹周}\f{<?>} \\[5mm]
576 \f{<dl>}\z{古禮}\f{</dl><?>}\z{德}\f{<}\z{運}\f{R>}\z{河之間。} \\[7mm]
577 \end{typeChinese}
578 } &
579 \includegraphics[height=5cm]{unreadable} \quad
580 \includegraphics[height=5cm]{text14p74_unclear}
581 \end{tabular}
582
583 \begin{note}
584 In the second example, the characters are readable but the double line (see \sect{section chinese underlinings}) is badly printed.
585 \end{note}
586
587 \begin{crossref}
588 For unknown rather than unreadable characters please refer to \sect{section unknown characters}.
589 \end{crossref}
590
591
592 \subsubsection{Unknown Characters}
593 \label{section unknown characters}
594
595 \begin{mainrule}
596 If there is an unknown character in the text, i.e. a character variant which is readable but where you cannot identify the standard character, add it to the numbered list of unknown characters. From then on, type its number whenever it occurs in the text, e.g. §<001>§.
597 \end{mainrule}
598
599 \begin{clarification}
600 Before you create a number for an unknown character, first check whether it is already on the list of unknown characters. Assign the number §<001>§ to the first unknown character, §<002>§ to the second unknown character, and so on. Do not assign the same number twice. Use this number to type the unknown character. Always use the same number if the same unknown character occurs again.
601 \end{clarification}
602
603 \begin{note}
604 Make sure that for a given text there is a single list containing all unknown characters, and that everyone uses this list. When the text is sent back to us, we will need a copy of this list. (See also \sect{section file conventions}.)
605 \end{note}
606
607 \begin{tabular}{@{}ll}
608 \parbox[b]{145.5mm}{
609 \htsc{Example \\[2mm] \s{an unknown character}} \\[15mm]
610 \begin{typeChinese}
611 \f{<}\z{得}\f{V>}\z{梁}\f{<001>}\z{玉}\f{<}\z{虎}\f{V><}\z{枕}\f{V>} \\[7mm]
612 \end{typeChinese}
613 } & \qquad
614 \includegraphics[height=5cm]{unknown_chinese_character2}
615 \end{tabular}
616
617 \vspace{3mm}
618 \begin{crossref}
619 For unreadable rather than unknown characters please refer to \sect{section characters you are unsure about}. For §< V>§, i.e. if a character variant is not included in Unicode but you can identify the standard character, see \sect{section character variants}.
620 \end{crossref}
621
622 \vspace{3mm}
623 \begin{note}
624 %§<001>§ is actually an unusual version of the variant \z{兾} of the character \z{冀}. If you can identify it as a version of the character variant, mark it as §<§\z{兾}§V>§ instead of §<001>§. If you cannot identify the variant but you can identify the standard character, mark it as §<§\z{冀}§V>§.
625 §<001>§ is actually an unusual version of the variant \z{兾} of the character \z{冀}. If you can identify the standard character \z{冀}, mark it as §<§\z{冀}§V>§ instead of §<001>§.
626
627 If in addition you can identify it as a version of the character variant \z{兾} (i.e. as a version of a character variant with a separate Unicode codepoint), mark it as §<§\z{兾}§V>§. (This special case is not mentioned in \sect{section character variants}.)
628 \end{note}
629
630
631 \tocspace
632 \section{Chinese Characters}
633
634 \tocspace
635 \subsection{General}
636
637 \subsubsection{Punctuation}
638 \label{section chinese punctuation}
639
640 \begin{mainrule}
641 Type the punctuation to the right of characters.
642 \end{mainrule}
643
644 \begin{crossref}
645 For an example see \sect{section chinese paragraphs}.
646 \end{crossref}
647
648
649 \subsubsection{Spaces}
650
651 \begin{mainrule}
652 Type spaces in Chinese text as the IDEOGRAPHIC SPACE character U+3000.
653 \end{mainrule}
654
655 \begin{clarification}
656 In running heads (§<rh>§, see \sect{section page breaks}) and headings (§<h>§ and §<ti>§, see \sect{section chinese headings}), type large spaces as a single ideographic space character.
657 In tables and lists (§<tb>§, §<list>§ and §<toc>§, see \sect{section structured text}), use §#§ for large spaces.
658 \end{clarification}
659
660 \begin{clarification}
661 If you encounter a large space in a normal paragraph (§<p>§, see the example in \sect{section chinese paragraphs}, third line from the bottom), make sure that none of the cases above apply. If it is indeed a normal paragraph, type the large space as more than one ideographic space, according to its length.
662 \end{clarification}
663
664 \begin{crossref}
665 For an example of large spaces that are typed as a single ideographic space character, see \sect{section page breaks}. For an example of large spaces that are typed as §#§, see \sect{section tables}.
666 \end{crossref}
667
668
669 \tocspace
670 \subsection{Character Variants}
671 \label{section character variants}
672
673
674 \subsubsection{Character Variants and Unicode}
675 \label{section character variants and unicode}
676
677 \begin{mainrule}
678 If a character variant is included in Unicode 5.1, type it. Do not normalize the variant.
679 %The rest of this section applies only to characters which are not included in Unicode.
680 \end{mainrule}
681
682 \begin{clarification}
683 For example, if the character variant \z{歴} of the character \z{歷} occurs in the text, type \z{歴} (U+6B74).
684 %\end{clarification}
685 %
686 %\begin{clarification}
687 Rather than working with the reference glyphs of the Unicode codepoints, you may use the fonts Sun-ExtA and Sun-ExtB normatively.
688 \end{clarification}
689
690 \vspace{5mm}
691 \begin{mainrule}
692 If a character variant is not included in Unicode 5.1, type the standard character instead. In addition, mark it by §< R>§ or §< V>§ if the rules in \sect{section rules for marking character variants} apply.
693 \end{mainrule}
694
695 \begin{crossref}
696 If you cannot identify the standard character, treat it as unknown character (see \sect{section unknown characters}).
697 \end{crossref}
698
699 \begin{clarification}
700 If a character variant should be marked, add it to the Character Variants List, i.e. add the image and how you have marked it. In addition, mark the first occurrence of the character variant in the text. After its first occurrence, silently normalize it. Begin a new Character Variants List for each text.
701 \end{clarification}
702
703 \begin{note}
704 In rare cases, the same text may contain the standard character and one or more different variants of this character. Please make a note in the Character Variants List, e.g. “S + V” or “V1 + V2” or “S + V1 + V2”. Include an image of each variant. In the text, mark the first occurrence of each variant using §< V1>§, §< V2>§, etc. Do not mark the standard character.
705 \end{note}
706
707 %\vspace{5mm}
708 \subsubsection{Rules for Marking Character Variants}
709 \label{section rules for marking character variants}
710
711 This sections contains \textsf{\textbf{Rule S}} for simple differences that need not be marked, \textsf{\textbf{Rule R}} for marking old radicals, and \textsf{\textbf{Rule V}} for other variations.
712
713 \begin{mainrule}
714 \paragraph{Rule S (silently normalizing simple differences):} If a character variant differs from the standard character only in the following points, type it as the standard character and do not mark the difference.
715 \end{mainrule}
716
717 \begin{clarification}
718 In paragraphs with individualized character style (see \sect{section individualized character style}) and in handwritten text (see \sect{section handwritten text}), silently normalize character variants if they are not in Unicode.
719 \end{clarification}
720
721 %\vspace{2mm}
722 %\begin{liste}[ 1: \, normalizations (from ISO 10646, slightly modified)]
723 %\begin{longtable}{@{}l@{ }ll} \\
724 %& Description & Examples \\[2mm]
725 %a) & Differences in rotated strokes/dots & \includegraphics{iso-a} \\
726 %b) & \parbox[t]{8cm}{Differences in overshoot at the stroke initiation and/or termination} & \includegraphics{iso-b} \\
727 %c) & \parbox[t]{8cm}{Differences in contact of strokes} & \includegraphics{iso-c} \\
728 %d) & \parbox[t]{8cm}{Differences in protrusion at the folded corner of strokes} & \includegraphics{iso-d} \\
729 %e) & \parbox[t]{8cm}{Differences in bent strokes} & \includegraphics{iso-e} \\
730 %f) & \parbox[t]{8cm}{Differences in folding back at the stroke termination} & \includegraphics{iso-f} \\
731 %g) & \parbox[t]{8cm}{Differences in accent at the stroke initiation} & \includegraphics{iso-g} \\
732 %h) & \parbox[t]{8cm}{Differences in “rooftop” modification} & \includegraphics{iso-h} \\
733 %i) & \parbox[t]{8cm}{Straightforward combinations of the above differences} & \includegraphics{iso-j} \\
734 %\end{longtable}
735 %\end{liste}
736
737 % Version aus 2.0.1:
738 %\vspace{3mm}
739 %\begin{liste}[: \, simple differences the need NOT be marked \, (from ISO 10646, slightly modified)]
740 %\begin{longtable}{@{}l@{ }ll}
741 %& Description & Examples \\[5mm]
742 %a) & Differences in rotated strokes/dots & \parbox[m]{8cm}{ \includegraphics{iso-a} } \\[5mm]
743 %b) & \parbox[m]{8cm}{Differences in overshoot at the stroke initiation and/or termination} & \parbox[m]{8cm}{ \includegraphics{iso-b2} } \\[5mm]
744 %c) & \parbox[t]{8cm}{Differences in contact of strokes} & \parbox[m]{8cm}{ \includegraphics{iso-c} } \\[5mm]
745 %d) & \parbox[m]{8cm}{Differences in protrusion at the folded corner of strokes} & \parbox[m]{8cm}{ \includegraphics{iso-d} } \\[5mm]
746 %e) & \parbox[t]{8cm}{Differences in bent strokes} & \parbox[m]{8cm}{ \includegraphics{iso-e} } \\[5mm]
747 %f) & \parbox[m]{8cm}{Differences in folding back at the stroke termination} & \parbox[m]{8cm}{ \includegraphics{iso-f} } \\[5mm]
748 %g) & \parbox[m]{8cm}{Differences in accent at the stroke initiation} & \parbox[m]{8cm}{ \includegraphics{iso-g} } \\[5mm]
749 %h) & \parbox[t]{8cm}{Differences in “rooftop” modification} & \parbox[m]{8cm}{ \includegraphics{iso-h} } \\[5mm]
750 %i) & \parbox[m]{8cm}{Straightforward combinations of the above differences} & \parbox[m]{8cm}{ \includegraphics{iso-j} } \\[5mm]
751 %\end{longtable}
752 %\end{liste}
753
754
755 %& \multicolumn{2}{@{}l}{\parbox[m]{16cm}{Do not mark \includegraphics{chin21zhi} (\z{之}) where the dot at the top touches or even overshoots the horizontal stroke. }} \\[5mm]
756 %& \multicolumn{2}{@{}l}{\parbox[m]{16cm}{Similarly, do not mark the difference between \includegraphics{chin21zhi} CHI and \z{斥} .}} \\[10mm]
757 %& \multicolumn{2}{@{}l}{\parbox[m]{16cm}{However, DO mark the difference between \z{亠} and \z{十} and between \z{卜} and \z{十}. Examples: \includegraphics{chin21zhi} HUAI <\z{櫰}V>, \includegraphics{chin21zhi} FEI <\z{肺}V>.}} \\[10mm]
758
759 \vspace{3mm}
760 \begin{liste}[: \, simple differences \, (with excerpts from ISO 10646)]
761
762 a) Differences in rotated strokes/dots
763
764 \begin{itemize}
765 \item[‒] Do NOT mark \,\parbox{8cm}{ \includegraphics{iso-a} }
766
767 \item[‒] Do NOT mark
768 \parbox{9mm}{ \includegraphics{chin21a1} } (\z{之})
769 where the dot at the top touches or even overshoots the horizontal stroke.
770 Similarly, do not mark the difference between
771 \parbox{8mm}{ \includegraphics{chin21a2} } and \z{斥}.
772
773 \vspace{2mm}
774 \item[+] DO mark the difference between \z{亠} and \z{十} and between \z{卜} and \z{十}. \\ Examples: \,
775 \parbox{8mm}{ \includegraphics{chin21a3} } <\z{櫰}V>,
776 \parbox{10mm}{ \includegraphics{chin21a4} } <\z{肺}V>.
777 \end{itemize}
778
779 \vspace{5mm}
780 b) Differences in overshoot at the stroke initiation and/or termination
781
782 \begin{itemize}
783 \item[‒] Do NOT mark \,\parbox{8cm}{ \includegraphics{iso-b2} }
784
785 \item[‒] Do NOT mark
786 \parbox{9mm}{ \includegraphics{chin21b1} } (\z{瓦}),
787 \parbox{8mm}{ \includegraphics{chin21b2} } (\z{耶}), or
788 \parbox{9mm}{ \includegraphics{chin21b4} } (\z{承}).
789 Also do not mark
790 \parbox{9mm}{ \includegraphics{chin21b5} } (\z{皴}),
791 i.e. the differences in the overshot/non-overshot of the character part \z{夕}.
792
793 \vspace{2mm}
794 \item[+] DO mark vertical (\z{竪}) and left-slanted (\z{撇}) overshoots. \\
795 Examples: \,
796 \parbox{9mm}{ \includegraphics{chin21b6} } <\z{割}V>,
797 \parbox{7mm}{ \includegraphics{chin21b7} } <\z{除}V>,
798 \parbox{10mm}{ \includegraphics{chin21b8} } <\z{楔}V>,
799 \parbox{10mm}{ \includegraphics{chin21b9} } <\z{鄂}V>,
800 \parbox{9mm}{ \includegraphics{chin21b10} } <\z{蛇}V>.
801 \end{itemize}
802
803 \vspace{5mm}
804 c) Differences in contact of strokes
805
806 \begin{itemize}
807 \item[‒] Do NOT mark \,\parbox{8cm}{ \includegraphics{iso-c} }
808
809 \item[+] DO mark connections of the vertical strokes of the component \z{日} with a horizontal stroke \z{一} below that look like a change from \z{旦} to \z{且}. \\
810 Example: The component \z{昜} in
811 \parbox{9mm}{ \includegraphics{chin21c1} } <\z{盪}V>.
812 %\includegraphics{chin21c1test.pdf} <\z{盪}V>.
813 \end{itemize}
814
815 \vspace{5mm}
816 d) Differences in protrusion at the folded corner of strokes
817
818 \begin{itemize}
819 \item[‒] Do NOT mark \,\parbox{8cm}{ \includegraphics{iso-d} }
820
821 \item[‒] Do NOT mark
822 \parbox{7mm}{ \includegraphics{chin21d1.pdf} } (\z{繩}) or
823 \parbox{7mm}{ \includegraphics{chin21d2.pdf} } (\z{斲}).
824
825 \item[‒] Do NOT mark the difference between the character components \z{已} (\textit{ji} “self”) and \z{己} (\textit{yi} “already”) unless you are completely sure.
826
827 \item[+] DO mark the difference between \z{巳}
828 %(\textit{si}, Earthly Branch “snake”)
829 and \z{已} / \z{己}. \\
830 Examples: \,
831 \parbox{7.5mm}{ \includegraphics{chin21d3.pdf} } <\z{忌}V>,
832 \parbox{9mm}{ \includegraphics{chin21d4.pdf} } <\z{包}V>.
833
834 \item[+] DO mark the difference between \z{㔾} and \z{巳} and the difference between \z{皿} and \z{罒}. \\
835 Examples: \,
836 \parbox{8mm}{ \includegraphics{chin21d5.pdf} } <\z{卷}V>,
837 \parbox{7mm}{ \includegraphics{chin21d6.pdf} } <\z{服}V>,
838 \parbox{7mm}{ \includegraphics{chin21d7.pdf} } <\z{衆}V>.
839 \end{itemize}
840
841 \vspace{5mm}
842 e) Differences in bent strokes
843
844 \begin{itemize}
845 \item[‒] Do NOT mark \,\parbox{8cm}{ \includegraphics{iso-e} }
846
847 \item[+] DO mark the difference between \z{巜} and \z{刂} and the difference between \z{术} and \z{朮}. In general, mark differences in the shape of a stroke if they lead to a different character component. \\
848 Examples: \,
849 \parbox{7mm}{ \includegraphics{chin21e1.pdf} } <\z{俞}V>,
850 \parbox{8mm}{ \includegraphics{chin21e2.pdf} } <\z{述}V>.
851 \end{itemize}
852
853 \vspace{5mm}
854 f) Differences in folding back at the stroke termination
855
856 \begin{itemize}
857 \item[‒] Do NOT mark \,\parbox{8cm}{ \includegraphics{iso-f} }
858 \end{itemize}
859
860 \vspace{5mm}
861 g) Differences in accent at the stroke initiation
862
863 \begin{itemize}
864 \item[‒] Do NOT mark \,\parbox{8cm}{ \includegraphics{iso-g} }
865 \end{itemize}
866
867 \vspace{5mm}
868 h) Differences in “rooftop” modification
869
870 \begin{itemize}
871 \item[‒] Do NOT mark \,\parbox{8cm}{ \includegraphics{iso-h} }
872
873 \item[‒] Do NOT mark for example
874 \parbox{7mm}{ \includegraphics{chin21h1.pdf} } (\z{肉}).
875
876 \item[+] DO mark the difference between \z{几} and \z{儿}. \\
877 Examples: \,
878 \parbox{8mm}{ \includegraphics{chin21h2.pdf} } <\z{兜}V>,
879 \parbox{7mm}{ \includegraphics{chin21h3.pdf} } <\z{虎}V>.
880 \end{itemize}
881
882 \vspace{5mm}
883 i) Straightforward combinations of the above differences
884
885 \begin{itemize}
886 \item[‒] Do NOT mark \,\parbox{8cm}{ \includegraphics{iso-j} }
887 \end{itemize}
888
889 \end{liste}
890
891 \vspace{3mm}
892 \begin{note}
893 The rules a) to i) leave the number of strokes unchanged. Consequently, changes in the number of strokes cannot be silently normalized and must be marked.
894
895 \vspace{2mm}
896 Note, however, that in some printing styles the strokes \extB{𠄌} (\textit{shuti} \z{竪提}) and \extB{𠃊} (\textit{shuzhe} \z{竪折}) appear to be a combination of two strokes, i.e. “vertical” (\z{丨}) plus “upward-slanted” (\z{㇀}). Do not mark these printing styles. \\
897 Examples: \,
898 \parbox{7mm}{ \includegraphics{chin21n1.pdf} } (\z{裏}),
899 \parbox{9mm}{ \includegraphics{chin21n2.pdf} } (\z{震}),
900 \parbox{6.5mm}{ \includegraphics{chin21n3.pdf} } (\z{改}),
901 \parbox{7mm}{ \includegraphics{chin21n4.pdf} } (\z{粵}),
902 \parbox{10mm}{ \includegraphics{chin21n5.pdf} } (\z{仰}).
903 \end{note}
904
905 \begin{mainrule}
906 \paragraph{Rule R (marking old radicals):} If a character such as \z{絨} (U+7D68) exists in Unicode 5.1 only with the new shape \z{糹} (U+7CF9) of the radical (\emph{bushou} \z{部首}) and not with the old shape \z{糸} (U+7CF8), mark the character variant with the old radical by §< R>§, for example §<§\z{絨}§R>§. Apply this rule only if the difference between the old and the new radical is not covered by rule S.
907 \end{mainrule}
908
909 \begin{crossref}
910 Appendix \ref{appendix radicals} contains a list of radicals that need to be marked.
911 \end{crossref}
912
913 \begin{note}
914 %The most significant examples of this rule are those where a graphem originally belonging to the sound-part of a character took over a graphical position that normally belongs to a radical while the actual radical of the character is "swallowed" by the sound-part. \\
915 %Rule R also applies when a character component has moved from the sound-part of the character to the radical part. \\
916 Rule R also applies when a character component from the sound-part of the character has swapped places with the actual radical. \\
917 Examples: \,
918 \parbox{10mm}{ \includegraphics{chin21r1.pdf} } <\z{穫}R>,
919 \parbox{5mm}{ \includegraphics{chin21r2.pdf} } <\z{墜}R>.
920 \end{note}
921
922 %\vspace{5mm}
923 \begin{mainrule}
924 \paragraph{Rule V (marking other variations):} If the non-radical part of the character variant differs from that of the standard character, mark the character variant with §< V>§. Apply this rule only if the difference is not covered by rule S.
925 \end{mainrule}
926
927 %\vspace{5mm}
928 %\begin{tabular}{@{}ll}
929 %\parbox[b]{134mm}{
930 %\htsc{Example \\[2mm] \s{a character variant with an additional stroke}} \\[-2mm]
931 %\begin{typeChinese}
932 %\f{<}\z{彈}\f{V>} \\
933 %\end{typeChinese}
934 %} & \qquad
935 % \includegraphics[height=2cm]{variante}
936 %\end{tabular}
937
938 %\begin{tabular}{@{}ll}
939 %\parbox[b]{139.5mm}{
940 %\htsc{Example \\[2mm] \s{a character variant not included in Unicode 5.1.0}} \\[15mm]
941 %\begin{typeChinese}
942 %\z{郡兩}\f{<}\z{穫}\f{V>}\z{者} \\[7mm]
943 %\end{typeChinese}
944 %} & \qquad
945 %\includegraphics[height=5cm]{text17-1p15_klein}
946 %\end{tabular}
947
948 \vspace{3mm}
949 \begin{tabular}{@{}ll}
950 \parbox[b]{122.5mm}{
951 \htsc{Examples} \\[15mm]
952 \begin{typeChinese}
953 \f{<}\z{彈}\f{V>} \\[5mm]
954 \z{郡兩}\f{<}\z{穫}\f{R>}\z{者} \\[5mm]
955 \end{typeChinese}
956 } &
957 \includegraphics[height=1.5cm]{variante} \qquad
958 \includegraphics[height=5cm]{text17-1p15_klein}
959 \end{tabular}
960
961 \vspace{2mm}
962 \begin{clarification}
963 If both rule R and rule V apply, mark the character variant by §< RV>§; see the example §<§\z{過}§RV>§ in \sect{section chinese paragraphs}.
964 \end{clarification}
965
966
967 \tocspace
968 \subsection{Type Styles}
969
970 \subsubsection{Small Characters}
971 \label{section chinese small characters}
972
973 \begin{mainrule}
974 Strings of small characters are marked by §<sm> </sm>§. Indicate half-column breaks by §\\§.
975 \end{mainrule}
976
977 \begin{crossref}
978 For an example see \sect{section chinese tocs} (second example). This examples includes strings of small characters over more than one line of text.
979 \end{crossref}
980
981
982 %\mehrzeilen[3]
983
984 \subsubsection{Underlinings}
985 \label{section chinese underlinings}
986
987 \begin{mainrule}
988 A single line next to characters is marked by §<sl> </sl>§.
989 A double line next to characters is marked by §<dl> </dl>§.
990 A circled line next to characters is marked by §<cl> </cl>§.
991 A wavy line next to characters is marked by §<wl> </wl>§.
992 \end{mainrule}
993
994 \begin{note}
995 In old texts, the lines are to the right of characters. In modern texts, the lines may also be to the left of characters. The position to the left or right is not encoded.
996 \end{note}
997
998 \begin{tabular}{@{}ll}
999 \parbox[b]{139mm}{
1000 \htsc{Example \\[2mm] \s{underlinings to the left and right}} \\[15mm]
1001 \begin{typeChinese}
1002 \f{<sl>}\z{康熙}\f{</sl><wl>}\z{寶應縣志}\f{</wl>}\z{人物志: 柏叢桂} \\
1003 \z{有司寢不行。}\f{<cl><sl>}\z{叢桂}\f{</sl>}\z{更相度地形畫圖}\f{</cl>}\z{。} \\[12mm]
1004 \end{typeChinese}
1005 } & \qquad
1006 \includegraphics[height=6cm]{Specs-Bild1_2}
1007 \end{tabular}
1008
1009 \begin{crossref}
1010 For an example with underlinings to the right of characters see \sect{section chinese paragraphs}. This example includes §<dl>§ for double lines.
1011 \end{crossref}
1012
1013 \newpage
1014 \subsubsection{Individualized Character Style}
1015 \label{section individualized character style}
1016
1017 \begin{mainrule}
1018 A paragraph in an individualized character style is marked by §ics§ in the §<p>§ tag, i.e. §<p ics>§.
1019 \end{mainrule}
1020
1021 \begin{clarification}
1022 If a character variant in a §<p ics>§ paragraph is not in Unicode, resolve it silently, i.e. do not use §< V>§ or §< R>§. However, use §<001>§ if a character is unknown.
1023 \end{clarification}
1024
1025 \begin{tabular}{@{}ll}
1026 \parbox[b]{138.5mm}{
1027 \htsc{Example} \\[5mm]
1028 \begin{typeChinese}
1029 \f{<p ics>}\z{光緒十六年} \\
1030 \z{冬印扵天津} \\
1031 \z{李鴻章署检}\f{</p>} \\[5mm]
1032 \end{typeChinese}
1033 } &
1034 \includegraphics[height=4cm]{text18-1p2}
1035 \end{tabular}
1036
1037
1038 \subsubsection{Handwritten Text}
1039 \label{section handwritten text}
1040
1041 \begin{mainrule}
1042 %%If a character has been crossed out, mark it by §{ }§.
1043 %%If there is a corrected character next to the crossed-out character, mark this by §{ / }§.
1044 %%If there is a line between two consecutive characters indicating that the order should be reversed, mark this by §{ ~ }§, but type the characters in the order as they appear in the text.
1045 %If a character has been crossed out, mark it by §{ -}§. e.g. §{§\z{四}§-}§.
1046 %If there is a corrected character next to the crossed-out character, mark this by §{ - }§, e.g. §{§\z{四}§-§\z{五}§}§. If one character has been written on top of another character and the original character is no longer readable, mark it by §{- }§, e.g. §{@-§\z{五}§}§.
1047 %If there is a line between two consecutive characters indicating that the order should be reversed, mark this by §{ ~ }§, but type the characters in the order as they appear in the text.
1048 If a character has been crossed out, mark it by §{ /}§, e.g. §{§\z{四}§/}§. If a character has been inserted, mark it by §{ }§, e.g. §{§\z{五}§}§. If the inserted character replaces a crossed-out character, mark this by §{§\z{四}§/§\z{五}§}§, or §{@/§\z{五}§}§ if the crossed-out character is no longer readable.
1049 \end{mainrule}
1050
1051 \begin{mainrule}
1052 If there is a line between two consecutive characters indicating that the order should be reversed, mark this by §{ ~ }§, but type the characters in the order as they appear in the text.
1053 \end{mainrule}
1054
1055 \begin{clarification}
1056 If a character variant in handwritten text is not in Unicode, resolve it silently, i.e. do not use §< V>§ or §< R>§. However, use §<001>§ if a character is unknown.
1057 \end{clarification}
1058
1059 \vspace{3mm}
1060 \begin{tabular}{@{}ll}
1061 \parbox[b]{56mm}{
1062 \htsc{Examples} \\[6mm]
1063 \begin{typeChinese}
1064 \z{均}\f{\{}\z{的加减号於次均}\f{\}}\z{旁又随錄} \\[5mm]
1065 \z{行內}\f{\{}\z{倒}\f{/}\z{减}\f{\}}\z{去} \\[2mm]
1066 \z{維}\f{\{@/}\z{揚}\f{\}}\z{人家} \\[5mm]
1067 \f{\{}\z{左}\f{\tld}\z{其}\f{\}} \\
1068 \end{typeChinese}
1069 } &
1070 \includegraphics[height=5cm]{tian_p18} \qquad
1071 \includegraphics[height=5cm]{hd_tian_p23} \,\,
1072 \includegraphics[height=5cm]{yin1_p27} \qquad
1073 \includegraphics[height=5cm]{xing_jing_p39}
1074 \end{tabular}
1075
1076 %\begin{tabular}{@{}ll}
1077 %\parbox[b]{8cm}{
1078 %\htsc{Examples} \\[25mm]
1079 %\begin{typeChinese}
1080 %xx\bold{\{}x\bold{\}}xx \\ \\
1081 %xxxx\{x/x\}\{x/x\}xx \\ \\
1082 %xx\bold{\tld}xxx \\
1083 %\end{typeChinese}
1084 %} & \qquad
1085 %\includegraphics[height=6cm]{Specs-Bild2-kt}
1086 %\end{tabular}
1087
1088 %%Or something like §<del>x</del>§, §<repl>xx</repl>§ and §<rev>xx</re>§?
1089
1090 \appendix
1091
1092 \newpage
1093 \section{Old Radicals That Need to be Marked}
1094 \label{appendix radicals}
1095
1096 \begin{note}
1097 This list is only a guideline and may not be complete.
1098 \end{note}
1099
1100 An entry such as \hira{⺿} \z{⻀} §(§\z{⺾}§)§ means that if a character has \hira{⺿} or \z{⻀} as the shape of its radical, and the character with this variant radical is not included in Unicode 5.1, type the standard character and add §< R>§.
1101 Example: §<§\z{蒼}§R>§.
1102
1103 Example of a radical that does not have to be marked: Do not mark the old shape \mincho{爫} of the radical \z{爫} because of point a) in the list in \sect{section rules for marking character variants}.
1104
1105 \vspace{3mm}
1106 \begin{liste}[: \, old radicals that need to be marked]
1107 \begin{tabular}{@{}l@{ }lll@{ }lll@{ }lll@{ }l} \\
1108 \z{彑} & §(§\z{彐}§)§ &&
1109 \z{糸} & §(§\z{糹}§)§ &&
1110 \z{⻞} & §(§\z{⻟}§)§ &&
1111 \sunExtB{𦈢} & §(§\z{缶}§)§ \\[2mm]
1112 \sunExtB{𦣞} & §(§\z{臣}§)§ &&
1113 \z{襾} & §(§\z{西}§)§ &&
1114 \sunExtB{𧢲} & §(§\z{角}§)§ &&
1115 \sunExtB{𧰧} & §(§\z{豕}§)§ \\[2mm]
1116 \z{赱} & §(§\z{走}§)§ &&
1117 \sunExtB{𨑄𨑃} & §(§\z{辰}§)§ &&
1118 \mincho{辶} & §(§\z{辶}§)§ &&
1119 \z{采} & §(§\z{釆}§)§ \\[2mm]
1120 \z{镸} & §(§\z{長}§)§ &&
1121 \sunExtA{门}\sunExtB{𨳇} & §(§\z{門}§)§ &&
1122 \sunExtB{𨸏} & §(§\z{阝}§)§ &&
1123 \z{靑} & §(§\z{青}§)§ \\[2mm]
1124 \sunExtA{靣}\sunExtB{𠚑} & §(§\z{面}§)§ &&
1125 \z{凬} & §(§\z{風}§)§ &&
1126 \sunExtB{𩙱} & §(§\z{飛}§)§ &&
1127 \sunExtB{𩙿𩚁} & §(§\z{飠}§)§ \\[2mm]
1128 \sunExtB{𩠐} & §(§\z{首}§)§ &&
1129 \sunExtB{𩡧} & §(§\z{馬}§)§ &&
1130 \z{髙} & §(§\z{高}§)§ &&
1131 \sunExtB{𩵋} & §(§\z{魚}§)§ \\[2mm]
1132 \sunExtB{𠧸} & §(§\z{鹵}§)§ &&
1133 \sunExtB{𢉖} & §(§\z{鹿}§)§ &&
1134 \z{黃} & §(§\z{黄}§)§ &&
1135 \z{黒} & §(§\z{黑}§)§ \\[2mm]
1136 \sunExtB{𪗄} & §(§\z{⿑}§)§ &&
1137 \z{歯} & §(§\z{齒}§)§ &&
1138 \sunExtB{𪛉𪚦} & §(§\z{⿔}§)§ &&
1139 \hira{⺿} \z{⻀} & §(§\z{⺾}§)§ \\
1140 \end{tabular}
1141 \end{liste}
1142
1143 \newpage
1144 \section{List of All Tags}
1145 \label{appendix list of all tags}
1146
1147 \begin{longtable}[l]{@{}llll@{}l@{}}
1148 section & tag & name & tag may contain \\[1mm]
1149 \hline \\
1150 \ref{section page breaks} & §<pb>§ & page break & page number, a/b \\
1151 \ref{section page breaks} & §<rh> </rh>§ & running head &\\
1152 \\
1153 \ref{section chinese headings} & §<h> </h>§ & heading & level number \\
1154 \ref{section chinese headings} & §<ti> </ti>§ & \emph{ti} \z{題} &\\
1155 \ref{section chinese paragraphs} & §<p> </p>§ & paragraph & §i§, §x§, §ics§ \\
1156 \\
1157 \ref{section tables} & §<tb> </tb>§ & table &\\
1158 \ref{section tables} & §#§ & field separator \\
1159 \ref{section chinese lists} & §<list> </list>§ & list &\\
1160 \ref{section chinese tocs} & §<toc> </toc>§ & table of contents &\\
1161 \\
1162 \ref{section chinese figures} & §<fig> </fig>§ & figure & \\
1163 \ref{section chinese figures} & §<cap> </cap>§ & figure caption &\\
1164 \ref{section chinese figures} & §<desc> </desc>§ & figure description &\\
1165 \ref{section chinese figures} & §<var> </var>§ & figure variables &\\
1166 \ref{section chinese stamps} & §<stamp> </stamp>§ & stamp & \\
1167 \\
1168 \ref{section characters you are unsure about} & §<?>§ & uncertain text & \\
1169 \ref{section characters you are unsure about} & §@§, §<gap>§ & unreadable text & \\
1170 \ref{section unknown characters} & §<001>§, etc. & unknown character & \\
1171 \\
1172 \hline \\
1173 \ref{section rules for marking character variants} & §< R>§ & old radical & \\
1174 \ref{section rules for marking character variants} & §< V>§ & character variant & \\
1175 \ref{section rules for marking character variants} & §< RV>§ & §< R>§ and §< V>§ & \\
1176 \\
1177 \ref{section chinese small characters} & §<sm> </sm>§ & small characters & \\
1178 \ref{section chinese small characters} & §\\§ & half-column breaks && \\
1179 \\
1180 \ref{section chinese underlinings} & §<sl> </sl>§ & single line & \\
1181 \ref{section chinese underlinings} & §<dl> </dl>§ & double line & \\
1182 \ref{section chinese underlinings} & §<cl> </cl>§ & circled line & \\
1183 \ref{section chinese underlinings} & §<wl> </wl>§ & wavy line & \\
1184 \\
1185 \ref{section handwritten text} & §{ /}§ & crossed-out character & \\
1186 \ref{section handwritten text} & §{ }§ & inserted character & \\
1187 \ref{section handwritten text} & §{ / }§ & character replacement & \\
1188 \ref{section handwritten text} & §{ ~ }§ & reversed characters & \\
1189 \\
1190 \hline \\
1191 \end{longtable}
1192
1193 \end{document}