view software/mpdl-services/mpiwg-mpdl-lt-web/WebContent/index.html @ 19:4a3641ae14d2

Erstellung
author Josef Willenborg <jwillenborg@mpiwg-berlin.mpg.de>
date Wed, 09 Nov 2011 15:32:05 +0100
parents
children 4ea0f81a5d08
line wrap: on
line source

<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.0//EN">
<html lang="en">
<head>
<!-- Static overview page listing the language technology service URLs, their parameters and example requests. -->
<meta http-equiv="Content-Type" content="text/html; charset=utf-8">
<title>Max Planck Institute for the History of Science - Mpdl: Language technology services</title>
</head>
<body>
<!-- Dedication and attribution notes, floated to the right so the heading below flows beside them. -->
<div style="float: right">
  [<i>This software is dedicated to <a href="http://mpdl-proto.mpiwg-berlin.mpg.de/mpdl/info.xql?info=malcolm">Dr. Malcolm Hyman</a></i>]
  <img src="/mpiwg-mpdl-lt-web/images/info.png" width="15" height="15" alt="Info"><br>
  [<i>It is based on <a href="http://archimedes.fas.harvard.edu/">Donatus and Pollux</a></i>]
  <img src="/mpiwg-mpdl-lt-web/images/info.png" width="15" height="15" alt="Info">
</div>
<h2>Max Planck Institute for the History of Science - Mpdl: Language technology services</h2>
<ul>
  <!-- GetDictionaryEntries: request parameters, response description and example links.
       Example hrefs are relative to this page; "&" is written as "&amp;" inside attribute values. -->
  <li><b>Url: /mpiwg-mpdl-lt-web/lt/GetDictionaryEntries</b>
    <ul>
      <li>Request parameters
        <ul>
          <li>query (required)
            <ul>
              <li>by one form or lemma (e.g. "revolution")</li>
              <li>by a list of forms or lemmas (e.g. "revolution equality brotherliness")</li>
              <li>by a prefix range: entries starting with a prefix (e.g. "a*")</li>
            </ul>
          </li>
          <li>inputType (optional)
            <ul>
              <li>"form"</li>
              <li>"lemma"</li>
              <li>default: "form"</li>
            </ul>
          </li>
          <li>language (optional)
            <ul>
              <li>ISO 639-3 specifier</li>
              <li>default: "eng"</li>
            </ul>
          </li>
          <li>dictionary (optional)
            <ul>
              <li>dictionary name, e.g. "webster"</li>
              <li>default: "all" (all dictionaries for the specified language)</li>
            </ul>
          </li>
          <li>outputType (optional)
            <ul>
              <li>"compact"</li>
              <li>"full"</li>
              <li>default: "compact"</li>
            </ul>
          </li>
          <li>outputFormat (optional)
            <ul>
              <li>"html"</li>
              <li>"xml"</li>
              <li>default: "xml"</li>
            </ul>
          </li>
          <li>normalization (optional)
            <ul>
              <li>"none"</li>
              <li>"norm"</li>
              <li>default: "norm"</li>
            </ul>
          </li>
          <li>resultPage (optional)
            <ul>
              <li>works only for range queries</li>
              <li>page number of the result (e.g. "2": result entries from position 51 to 100)</li>
              <li>default: "1"</li>
            </ul>
          </li>
        </ul>
      </li>
      <li>Response output
        <ul>
          <li>depending on outputFormat, outputType and resultPage: morphology, dictionary and Wikipedia entries in Xml or Html format</li>
          <li>Example: <a href="lt/GetDictionaryEntries?query=a*&amp;dictionary=ls">query=a*&amp;dictionary=ls</a></li>
          <li>Example: <a href="lt/GetDictionaryEntries?query=a*&amp;language=lat&amp;outputFormat=html">query=a*&amp;language=lat&amp;outputFormat=html</a></li>
          <!-- Link text now matches the href, which requests language=eng. -->
          <li>Example: <a href="lt/GetDictionaryEntries?query=revolution&amp;language=eng">query=revolution&amp;language=eng</a></li>
          <li>Example: <a href="lt/GetDictionaryEntries?query=multa&amp;language=lat&amp;outputFormat=html&amp;outputType=full">query=multa&amp;language=lat&amp;outputFormat=html&amp;outputType=full</a></li>
        </ul>
      </li>
    </ul>
  </li>

  <!-- GetLemmas: request parameters, response description and an example link.
       The example href is relative to this page; "&" is written as "&amp;" inside the attribute value. -->
  <li><b>Url: /mpiwg-mpdl-lt-web/lt/GetLemmas</b>
    <ul>
      <li>Request parameters
        <ul>
          <li>query (required)
            <ul>
              <li>one form or lemma (e.g. "revolution") or</li>
              <li>blank separated list of forms or lemmas (e.g. "revolution equality brotherliness")</li>
            </ul>
          </li>
          <li>inputType (optional)
            <ul>
              <li>"form"</li>
              <li>"lemma"</li>
              <li>default: "form"</li>
            </ul>
          </li>
          <li>language (optional)
            <ul>
              <li>ISO 639-3 specifier</li>
              <li>default: "eng"</li>
            </ul>
          </li>
          <li>outputType (optional)
            <ul>
              <li>"compact"</li>
              <li>"full"</li>
              <li>default: "compact"</li>
            </ul>
          </li>
          <li>outputFormat (optional)
            <ul>
              <li>"html"</li>
              <li>"xml"</li>
              <li>"string" (lemma names separated by a blank)</li>
              <li>default: "xml"</li>
            </ul>
          </li>
          <li>normalization (optional)
            <ul>
              <li>"none"</li>
              <li>"norm"</li>
              <li>default: "norm"</li>
            </ul>
          </li>
        </ul>
      </li>
      <li>Response output
        <ul>
          <li>depending on outputFormat and outputType: lemma entries in Xml or Html or string format</li>
          <li>Example: <a href="lt/GetLemmas?query=multa&amp;language=lat&amp;outputFormat=html">query=multa&amp;language=lat&amp;outputFormat=html</a></li>
        </ul>
      </li>
    </ul>
  </li>

  <!-- GetForms: request parameters, response description and an example link.
       The example href is relative to this page; "&" is written as "&amp;" and the blank
       between the two query words is percent-encoded as %20. -->
  <li><b>Url: /mpiwg-mpdl-lt-web/lt/GetForms</b>
    <ul>
      <li>Request parameters
        <ul>
          <li>query (required)
            <ul>
              <li>one lemma (e.g. "revolution") or</li>
              <li>blank separated list of lemmas (e.g. "revolution equality brotherliness")</li>
            </ul>
          </li>
          <li>language (optional)
            <ul>
              <li>ISO 639-3 specifier</li>
              <li>default: "eng"</li>
            </ul>
          </li>
          <li>outputType (optional)
            <ul>
              <li>"compact"</li>
              <li>"full"</li>
              <li>default: "compact"</li>
            </ul>
          </li>
          <li>outputFormat (optional)
            <ul>
              <li>"html"</li>
              <li>"xml"</li>
              <li>"string" (form names separated by a blank)</li>
              <li>default: "xml"</li>
            </ul>
          </li>
          <li>normalization (optional)
            <ul>
              <li>"none"</li>
              <li>"norm"</li>
              <li>default: "norm"</li>
            </ul>
          </li>
        </ul>
      </li>
      <li>Response output
        <ul>
          <li>depending on outputFormat and outputType: form entries in Xml or Html or string format</li>
          <li>Example: <a href="lt/GetForms?query=edo%20sum&amp;language=lat&amp;outputFormat=string">query=edo sum&amp;language=lat&amp;outputFormat=string</a></li>
        </ul>
      </li>
    </ul>
  </li>

  <!-- Tokenize: request parameters, response description and example links.
       Example hrefs are relative to this page; "&" is written as "&amp;", blanks as %20 and
       the long s (U+017F) as its UTF-8 percent-encoding %C5%BF. The "%26" sequences belong to
       the nested srcUrl value and are kept as they were. -->
  <li><b>Url: /mpiwg-mpdl-lt-web/text/Tokenize</b>
    <ul>
      <li>Request parameters
        <ul>
          <li>inputString or srcUrl (required)
            <ul>
              <li>inputString
                <ul>
                  <li>string which should be tokenized
                    <ul>
                      <li>unstructured text</li>
                      <li>XML fragment/document</li>
                    </ul>
                  </li>
                </ul>
              </li>
              <li>srcUrl
                <ul>
                  <li>source URL
                    <ul>
                      <li>unstructured text</li>
                      <li>XML fragment/document</li>
                    </ul>
                  </li>
                </ul>
              </li>
            </ul>
          </li>
          <li>language (optional)
            <ul>
              <li>ISO 639-3 specifier</li>
              <li>if input is XML and an element contains the attribute "xml:lang" this value is used for this element</li>
              <li>default: "eng"</li>
            </ul>
          </li>
          <li>normalization (optional)
            <ul>
              <li>"none"</li>
              <li>"norm"</li>
              <li>default: "norm"</li>
            </ul>
          </li>
          <li>dictionary (optional)
            <ul>
              <li>"yes"</li>
              <li>"no"</li>
              <li>default: "yes"</li>
            </ul>
          </li>
          <li>stopElements (optional)
            <ul>
              <li>list of xml element names which should not be tokenized (e.g. "var")</li>
              <li>default: empty list</li>
            </ul>
          </li>
          <li>outputFormat (optional)
            <ul>
              <li>"xml"</li>
              <li>"string"</li>
              <li>default: "xml"</li>
            </ul>
          </li>
          <li>outputOptions (optional)
            <ul>
              <li>output options separated with blanks (e.g. "withForms withLemmas")
                <ul>
                  <li>"withForms"</li>
                  <li>"withLemmas"</li>
                  <li>default: empty list</li>
                </ul>
              </li>
            </ul>
          </li>
        </ul>
      </li>
      <li>Response output
        <ul>
          <li>outputFormat=xml
            <ul>
              <li>tokenized inputString or document (enriched by element &lt;w&gt;)
                <ul>
                  <li>Example: &lt;s&gt;&lt;w lang="deu" form="dies" forms="dies, dieser, dieses, diesen" lemmas="dieser"&gt;Dies&lt;/w&gt; &lt;w
                  lang="deu" form="ist" forms="bin, bist, ist, seid, sind, sein, war, warst, wart" lemmas="sein"&gt;ist&lt;/w&gt; &lt;w
                  lang="deu" form="ein" forms="ein, eines, einer" lemmas="ein"&gt;ein&lt;/w&gt; &lt;w lang="deu" form="satz"
                  forms="satz, sätze, satzes" lemmas="satz"&gt;Satz&lt;/w&gt;&lt;/s&gt;
                  </li>
                </ul>
              </li>
            </ul>
          </li>
          <li>outputFormat=string
            <ul>
              <li>word tokens of inputString or document (separated by a blank)</li>
            </ul>
          </li>
          <li>Example: <a href="text/Tokenize?inputString=edo%20sum%20philo%C5%BFophi&amp;language=lat&amp;outputFormat=xml">inputString=edo sum philoſophi&amp;language=lat&amp;outputFormat=xml</a></li>
          <li>Example: <a href="text/Tokenize?srcUrl=http://mpdl-system.mpiwg-berlin.mpg.de/mpdl/page-query-result.xql?document=/echo/la/Benedetti_1585.xml%26mode=pureXml%26pn=13&amp;language=lat">srcUrl=http://mpdl-system.mpiwg-berlin.mpg.de/mpdl/page-query-result.xql?document=/echo/la/Benedetti_1585.xml%26mode=pureXml%26pn=13&amp;language=lat</a></li>
          <li>Example: <a href="text/Tokenize?srcUrl=http://mpdl-system.mpiwg-berlin.mpg.de/mpdl/page-query-result.xql?document=/echo/la/Benedetti_1585.xml%26mode=pureXml%26pn=13&amp;language=lat&amp;outputOptions=withForms%20withLemmas">srcUrl=http://mpdl-system.mpiwg-berlin.mpg.de/mpdl/page-query-result.xql?document=/echo/la/Benedetti_1585.xml%26mode=pureXml%26pn=13&amp;language=lat&amp;outputOptions=withForms withLemmas</a></li>
        </ul>
      </li>
    </ul>
  </li>

  <!-- Normalize: request parameters, response description and an example link.
       The example href is relative to this page; "&" is written as "&amp;" and the long s
       (U+017F) as its UTF-8 percent-encoding %C5%BF. -->
  <li><b>Url: /mpiwg-mpdl-lt-web/text/Normalize</b>
    <ul>
      <li>Request parameters
        <ul>
          <li>inputString (required)
            <ul>
              <li>string which should be normalized</li>
            </ul>
          </li>
          <li>language (optional)
            <ul>
              <li>ISO 639-3 specifier</li>
              <li>default: "eng"</li>
            </ul>
          </li>
          <li>type (optional)
            <ul>
              <li>"dictionary"</li>
              <li>"display"</li>
              <li>default: "display"</li>
            </ul>
          </li>
        </ul>
      </li>
      <li>Response output
        <ul>
          <li>normalized string</li>
          <li>Example: <a href="text/Normalize?inputString=philo%C5%BFophi&amp;language=lat">inputString=philoſophi&amp;language=lat</a></li>
        </ul>
      </li>
    </ul>
  </li>

  <!-- Transcode: request parameters, response description and an example link.
       The example href is relative to this page; "&" is written as "&amp;" inside the attribute value. -->
  <li><b>Url: /mpiwg-mpdl-lt-web/text/Transcode</b>
    <ul>
      <li>Request parameters
        <ul>
          <li>inputString (required)
            <ul>
              <li>string which should be transcoded</li>
            </ul>
          </li>
          <li>srcEncoding (required)
            <ul>
              <li>"betacode"</li>
              <li>"buckwalter"</li>
              <li>"unicode"</li>
            </ul>
          </li>
          <li>destEncoding (optional)
            <ul>
              <li>"betacode"</li>
              <li>"buckwalter"</li>
              <li>"unicode"</li>
              <li>default: "unicode"</li>
            </ul>
          </li>
        </ul>
      </li>
      <li>Response output
        <ul>
          <li>transcoded string</li>
          <li>Example: <a href="text/Transcode?inputString=kai/&amp;srcEncoding=betacode&amp;destEncoding=unicode">inputString=kai/&amp;srcEncoding=betacode&amp;destEncoding=unicode</a></li>
        </ul>
      </li>
    </ul>
  </li>
</ul>   
 
</body>
</html>