comparison software/mpdl-services/mpiwg-mpdl-lt-web/WebContent/index.html @ 19:4a3641ae14d2

Erstellung
author Josef Willenborg <jwillenborg@mpiwg-berlin.mpg.de>
date Wed, 09 Nov 2011 15:32:05 +0100
parents
children 4ea0f81a5d08
comparison
equal deleted inserted replaced
18:dc5e9fcb3fdc 19:4a3641ae14d2
1 <!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.0//EN">
2 <html>
3 <head>
4 <meta http-equiv="Content-Type" content="text/html; charset=utf-8">
5 <title>Max Planck Institute for the History of Science - Mpdl: Language technology services</title>
6 </head>
7 <body>
8 <table align="right">
9 <tr>
10 <td>
11 [<i>This software is dedicated to <a href="http://mpdl-proto.mpiwg-berlin.mpg.de/mpdl/info.xql?info=malcolm">Dr. Malcolm Hyman</a></i>]
12 <img src="/mpiwg-mpdl-lt-web/images/info.png" width="15" height="15" border="0" alt="Info"/><br/>
13 [<i>It is based on <a href="http://archimedes.fas.harvard.edu/">Donatus and Pollux</a></i>]
14 <img src="/mpiwg-mpdl-lt-web/images/info.png" width="15" height="15" border="0" alt="Info"/>
15 </td>
16 </tr>
17 </table>
18 <h2>Max Planck Institute for the History of Science - Mpdl: Language technology services</h2>
19 <ul>
20 <li><b>Url: /mpiwg-mpdl-lt-web/lt/GetDictionaryEntries</b>
21 <ul>
22 <li>Request parameters
23 <ul>
24 <li>query (required)
25 <ul>
26 <li>by one form or lemma (e.g. "revolution")</li>
27 <li>by a list of forms or lemmas (e.g. "revolution equality brotherliness")</li>
28 <li>by a prefix range: entries starting with a prefix (e.g. "a*")</li>
29 </ul>
30 </li>
31 <li>inputType (optional)
32 <ul>
33 <li>"form"</li>
34 <li>"lemma"</li>
35 <li>default: "form"</li>
36 </ul>
37 </li>
38 <li>language (optional)
39 <ul>
40 <li>ISO 639-3 specifier</li>
41 <li>default: "eng"</li>
42 </ul>
43 </li>
44 <li>dictionary (optional)
45 <ul>
46 <li>dictionary name, e.g. "webster"</li>
47 <li>default: "all" (all dictionaries for the specified language)</li>
48 </ul>
49 </li>
50 <li>outputType (optional)
51 <ul>
52 <li>"compact"</li>
53 <li>"full"</li>
54 <li>default: "compact"</li>
55 </ul>
56 </li>
57 <li>outputFormat (optional)
58 <ul>
59 <li>"html"</li>
60 <li>"xml"</li>
61 <li>default: "xml"</li>
62 </ul>
63 </li>
64 <li>normalization (optional)
65 <ul>
66 <li>"none"</li>
67 <li>"norm"</li>
68 <li>default: "norm"</li>
69 </ul>
70 </li>
71 <li>resultPage (optional)
72 <ul>
73 <li>works only for range queries</li>
74 <li>page number of the result (e.g. "2": result entries from position 51 to 100)</li>
75 <li>default: "1"</li>
76 </ul>
77 </li>
78 </ul>
79 </li>
80 <li>Response output
81 <ul>
82 <li>depending on outputFormat, outputType and resultPage: morphology, dictionary and Wikipedia entries in Xml or Html format</li>
83 <li>Example: <a href="lt/GetDictionaryEntries?query=a*&amp;dictionary=ls">query=a*&amp;dictionary=ls</a></li>
84 <li>Example: <a href="lt/GetDictionaryEntries?query=a*&amp;language=lat&amp;outputFormat=html">query=a*&amp;language=lat&amp;outputFormat=html</a></li>
85 <li>Example: <a href="lt/GetDictionaryEntries?query=revolution&amp;language=eng">query=revolution&amp;language=eng</a></li>
86 <li>Example: <a href="lt/GetDictionaryEntries?query=multa&amp;language=lat&amp;outputFormat=html&amp;outputType=full">query=multa&amp;language=lat&amp;outputFormat=html&amp;outputType=full</a></li>
87 </ul>
88 </li>
89 </ul>
90 </li>
91
92 <li><b>Url: /mpiwg-mpdl-lt-web/lt/GetLemmas</b>
93 <ul>
94 <li>Request parameters
95 <ul>
96 <li>query (required)
97 <ul>
98 <li>one form or lemma (e.g. "revolution") or</li>
99 <li>blank separated list of forms or lemmas (e.g. "revolution equality brotherliness")</li>
100 </ul>
101 </li>
102 <li>inputType (optional)
103 <ul>
104 <li>"form"</li>
105 <li>"lemma"</li>
106 <li>default: "form"</li>
107 </ul>
108 </li>
109 <li>language (optional)
110 <ul>
111 <li>ISO 639-3 specifier</li>
112 <li>default: "eng"</li>
113 </ul>
114 </li>
115 <li>outputType (optional)
116 <ul>
117 <li>"compact"</li>
118 <li>"full"</li>
119 <li>default: "compact"</li>
120 </ul>
121 </li>
122 <li>outputFormat (optional)
123 <ul>
124 <li>"html"</li>
125 <li>"xml"</li>
126 <li>"string" (lemma names separated by a blank)</li>
127 <li>default: "xml"</li>
128 </ul>
129 </li>
130 <li>normalization (optional)
131 <ul>
132 <li>"none"</li>
133 <li>"norm"</li>
134 <li>default: "norm"</li>
135 </ul>
136 </li>
137 </ul>
138 </li>
139 <li>Response output
140 <ul>
141 <li>depending on outputFormat and outputType: lemma entries in Xml or Html or string format</li>
142 <li>Example: <a href="lt/GetLemmas?query=multa&amp;language=lat&amp;outputFormat=html">query=multa&amp;language=lat&amp;outputFormat=html</a></li>
143 </ul>
144 </li>
145 </ul>
146 </li>
147
148 <li><b>Url: /mpiwg-mpdl-lt-web/lt/GetForms</b>
149 <ul>
150 <li>Request parameters
151 <ul>
152 <li>query (required)
153 <ul>
154 <li>one lemma (e.g. "revolution") or</li>
155 <li>blank separated list of lemmas (e.g. "revolution equality brotherliness")</li>
156 </ul>
157 </li>
158 <li>language (optional)
159 <ul>
160 <li>ISO 639-3 specifier</li>
161 <li>default: "eng"</li>
162 </ul>
163 </li>
164 <li>outputType (optional)
165 <ul>
166 <li>"compact"</li>
167 <li>"full"</li>
168 <li>default: "compact"</li>
169 </ul>
170 </li>
171 <li>outputFormat (optional)
172 <ul>
173 <li>"html"</li>
174 <li>"xml"</li>
175 <li>"string" (form names separated by a blank)</li>
176 <li>default: "xml"</li>
177 </ul>
178 </li>
179 <li>normalization (optional)
180 <ul>
181 <li>"none"</li>
182 <li>"norm"</li>
183 <li>default: "norm"</li>
184 </ul>
185 </li>
186 </ul>
187 </li>
188 <li>Response output
189 <ul>
190 <li>depending on outputFormat and outputType: form entries in Xml or Html or string format</li>
191 <li>Example: <a href="lt/GetForms?query=edo%20sum&amp;language=lat&amp;outputFormat=string">query=edo sum&amp;language=lat&amp;outputFormat=string</a></li>
192 </ul>
193 </li>
194 </ul>
195 </li>
196
197 <li><b>Url: /mpiwg-mpdl-lt-web/text/Tokenize</b>
198 <ul>
199 <li>Request parameters
200 <ul>
201 <li>inputString or srcUrl (required)
202 <ul>
203 <li>inputString
204 <ul>
205 <li>string which should be tokenized
206 <ul>
207 <li>unstructured text</li>
208 <li>XML fragment/document</li>
209 </ul>
210 </li>
211 </ul>
212 </li>
213 <li>srcUrl
214 <ul>
215 <li>source URL
216 <ul>
217 <li>unstructured text</li>
218 <li>XML fragment/document</li>
219 </ul>
220 </li>
221 </ul>
222 </li>
223 </ul>
224 </li>
225 <li>language (optional)
226 <ul>
227 <li>ISO 639-3 specifier</li>
228 <li>if input is XML and an element contains the attribute "xml:lang" this value is used for this element</li>
229 <li>default: "eng"</li>
230 </ul>
231 </li>
232 <li>normalization (optional)
233 <ul>
234 <li>"none"</li>
235 <li>"norm"</li>
236 <li>default: "norm"</li>
237 </ul>
238 </li>
239 <li>dictionary (optional)
240 <ul>
241 <li>"yes"</li>
242 <li>"no"</li>
243 <li>default: "yes"</li>
244 </ul>
245 </li>
246 <li>stopElements (optional)
247 <ul>
248 <li>list of xml element names which should not be tokenized (e.g. "var")</li>
249 <li>default: empty list</li>
250 </ul>
251 </li>
252 <li>outputFormat (optional)
253 <ul>
254 <li>"xml"</li>
255 <li>"string"</li>
256 <li>default: "xml"</li>
257 </ul>
258 </li>
259 <li>outputOptions (optional)
260 <ul>
261 <li>output options separated with blanks (e.g. "withForms withLemmas")
262 <ul>
263 <li>"withForms"</li>
264 <li>"withLemmas"</li>
265 <li>default: empty list</li>
266 </ul>
267 </li>
268 </ul>
269 </li>
270 </ul>
271 </li>
272 <li>Response output
273 <ul>
274 <li>outputFormat=xml
275 <ul>
276 <li>tokenized inputString or document (enriched by element &lt;w&gt;)
277 <ul>
278 <li>Example: &lt;s&gt;&lt;w lang="deu" form="dies" forms="dies, dieser, dieses, diesen" lemmas="dieser"&gt;Dies&lt;/w&gt; &lt;w
279 lang="deu" form="ist" forms="bin, bist, ist, seid, sind, sein, war, warst, wart" lemmas="sein"&gt;ist&lt;/w&gt; &lt;w
280 lang="deu" form="ein" forms="ein, eines, einer" lemmas="ein"&gt;ein&lt;/w&gt; &lt;w lang="deu" form="satz"
281 forms="satz, sätze, satzes" lemmas="satz"&gt;Satz&lt;/w&gt;&lt;/s&gt;
282 </li>
283 </ul>
284 </li>
285 </ul>
286 <li>outputFormat=string
287 <ul>
288 <li>word tokens of inputString or document (separated by a blank)</li>
289 </ul>
290 <li>Example: <a href="text/Tokenize?inputString=edo%20sum%20philoſophi&amp;language=lat&amp;outputFormat=xml">inputString=edo sum philoſophi&amp;language=lat&amp;outputFormat=xml</a></li>
291 <li>Example: <a href="text/Tokenize?srcUrl=http://mpdl-system.mpiwg-berlin.mpg.de/mpdl/page-query-result.xql?document=/echo/la/Benedetti_1585.xml%26mode=pureXml%26pn=13&amp;language=lat">srcUrl=http://mpdl-system.mpiwg-berlin.mpg.de/mpdl/page-query-result.xql?document=/echo/la/Benedetti_1585.xml%26mode=pureXml%26pn=13&amp;language=lat</a></li>
292 <li>Example: <a href="text/Tokenize?srcUrl=http://mpdl-system.mpiwg-berlin.mpg.de/mpdl/page-query-result.xql?document=/echo/la/Benedetti_1585.xml%26mode=pureXml%26pn=13&amp;language=lat&amp;outputOptions=withForms%20withLemmas">srcUrl=http://mpdl-system.mpiwg-berlin.mpg.de/mpdl/page-query-result.xql?document=/echo/la/Benedetti_1585.xml%26mode=pureXml%26pn=13&amp;language=lat&amp;outputOptions=withForms withLemmas</a></li>
293 </ul>
294 </li>
295 </ul>
296 </li>
297
298 <li><b>Url: /mpiwg-mpdl-lt-web/text/Normalize</b>
299 <ul>
300 <li>Request parameters
301 <ul>
302 <li>inputString (required)
303 <ul>
304 <li>string which should be normalized</li>
305 </ul>
306 </li>
307 <li>language (optional)
308 <ul>
309 <li>ISO 639-3 specifier</li>
310 <li>default: "eng"</li>
311 </ul>
312 </li>
313 <li>type (optional)
314 <ul>
315 <li>"dictionary"</li>
316 <li>"display"</li>
317 <li>default: "display"</li>
318 </ul>
319 </li>
320 </ul>
321 </li>
322 <li>Response output
323 <ul>
324 <li>normalized string</li>
325 <li>Example: <a href="text/Normalize?inputString=philoſophi&amp;language=lat">inputString=philoſophi&amp;language=lat</a></li>
326 </ul>
327 </li>
328 </ul>
329 </li>
330
331 <li><b>Url: /mpiwg-mpdl-lt-web/text/Transcode</b>
332 <ul>
333 <li>Request parameters
334 <ul>
335 <li>inputString (required)
336 <ul>
337 <li>string which should be transcoded</li>
338 </ul>
339 </li>
340 <li>srcEncoding (required)
341 <ul>
342 <li>"betacode"</li>
343 <li>"buckwalter"</li>
344 <li>"unicode"</li>
345 </ul>
346 </li>
347 <li>destEncoding (optional)
348 <ul>
349 <li>"betacode"</li>
350 <li>"buckwalter"</li>
351 <li>"unicode"</li>
352 <li>default: "unicode"</li>
353 </ul>
354 </li>
355 </ul>
356 </li>
357 <li>Response output
358 <ul>
359 <li>transcoded string</li>
360 <li>Example: <a href="text/Transcode?inputString=kai/&amp;srcEncoding=betacode&amp;destEncoding=unicode">inputString=kai/&amp;srcEncoding=betacode&amp;destEncoding=unicode</a></li>
361 </ul>
362 </li>
363 </ul>
364 </li>
365 </ul>
366
367 </body>
368 </html>
369
370