# Reconstructed from a whitespace-collapsed CVS diff of
# OSAS/OSA_system/OSAS_helpers.py (revision 1.2 -> revision 1.6).
#
# Only the part of that change which is complete in the diff is reproduced
# here as code: the added ``import urllib`` and the added function
# readArchimedesXML.  The remaining two hunks touch changeNodesInIndexMeta,
# whose definition is not fully contained in the diff.  They
#   * wrap ``root.removeChild(nodeOld[0]).unlink()`` in a try/except that
#     ignores a failing removal, and
#   * replace ``subnodes[subnode].decode("utf8")`` with
#     ``unicode(subnodes[subnode],"utf8")`` in both createTextNode calls.

import xml.dom.minidom
import os.path
import re
import urllib

# URL that readArchimedesXML queries when the caller does not supply one.
_ARCHIMEDES_MANIFEST_URL = "http://archimedes.mpiwg-berlin.mpg.de/cgi-bin/toc/toc.cgi?step=xmlcorpusmanifest"


def _openUrl(url):
    """Open *url* with the urlopen flavour the running interpreter provides."""
    try:
        from urllib.request import urlopen  # Python 3
    except ImportError:
        urlopen = urllib.urlopen  # Python 2
    return urlopen(url)


def readArchimedesXML(folder, url=_ARCHIMEDES_MANIFEST_URL):
    """Return the ``xml`` attribute of the ``<item>`` whose ``dir`` is *folder*.

    The XML document at *url* is downloaded and parsed, and its ``<item>``
    elements are scanned for one whose ``dir`` attribute equals *folder*.
    Items that lack either the ``dir`` or the ``xml`` attribute are skipped.
    If several items share the same ``dir``, the last one wins.

    Args:
        folder: value to look for in the ``dir`` attribute of the items.
        url: location of the XML document; defaults to the Archimedes
            ``toc.cgi`` URL that was previously hard-coded.

    Returns:
        The ``xml`` attribute value of the matching item, or ``""`` when no
        item matches or when the document cannot be fetched or parsed.
    """
    try:
        response = _openUrl(url)
        try:
            content = response.read()
        finally:
            # Release the connection even when reading fails.
            response.close()
        dom = xml.dom.minidom.parseString(content)
    except Exception:
        # The lookup is best effort: any download or parse problem is
        # reported to the caller as "nothing found".  Unlike a bare
        # ``except:`` this lets SystemExit and KeyboardInterrupt through.
        return ""

    found = ""
    for item in dom.getElementsByTagName('item'):
        if not (item.hasAttribute('dir') and item.hasAttribute('xml')):
            continue
        if item.getAttribute('dir') == folder:
            # No early return: a later duplicate overrides an earlier one.
            found = item.getAttribute('xml')
    dom.unlink()
    return found