--- storage/meta/meta-format.tex 2003/08/15 22:29:42 1.7 +++ storage/meta/meta-format.tex 2003/09/11 14:21:42 1.10 @@ -16,7 +16,7 @@ \author{Robert Casties, Dirk Wintergrün, Hans-Christoph Liess} -\date{V1.0.1 of 12.8.2003} +\date{V1.0.3 of 11.9.2003} \begin{document} @@ -523,7 +523,7 @@ appear multiple times. \end{description} -\subsection{Information on the document structure (table of contents)} +\subsection{Document structure (table of contents)} \label{sec:toc} Information on the structure of a document like the division into @@ -606,7 +606,7 @@ tags. %%\url{http://pythia.mpiwg-berlin.mpg.de/toolserver/TS_lise} -\subsection{Information on scanned images} +\subsection{Scanned images} \label{sec:inform-scann-imag} Image files representing scanned images can have an \texttt{img} @@ -659,11 +659,67 @@ or \end{description} + +\subsection{Image acquisition} +\label{sec:inform-about-image} + +A description of the technology used in the process of producing a +digital image. + +\begin{description} +\item[image-acquisition] description of the image production process + \begin{description} + \item[device] acquisition device (e.g. ``flatbed scanner'') + + \item[image-type] type and color-depth of the image (e.g. ``RGB 24 + bit'') + + \item[postproduction] additional operations on the image + (e.g. ``sharpening, color correction'') + + \item[production-comment] additional textual information about the + production process + \end{description} +\end{description} + + \subsection{Full text with images} \label{sec:full-text-with} -The relation of a full text in a XML format and optional images of -whole pages or parts of pages +Full text in an XML format will be specified with a +\texttt{content-type} ``fulltext''. + +The relation between the full text and optional images of +whole pages or parts of pages must be specified in a +\texttt{text-tool} container. 
+ +\begin{description} +\item[text-tool] representation of full text with images + + \begin{description} + \item[text-file] the file name of the full text file (with path + inside document directory) + + \item[page-images] the directory name of the directory containing the + page image files (with path + inside document directory) + + \item[xslt-file] the file name of an additional XSL transformation + file + + \item[text-config] container for configuration options + \begin{description} + \item[container-tag] the name of the text root element (default + ``text'') + + \item[ref-element-tag] the name of the element that is used as + unit of reference when results are presented + + \item[pagebreak-tag] the name of the element that indicates page + breaks (default ``pb'') + \end{description} + \end{description} +\end{description}