0
|
1 """Utility methods for handling XML, reading HTTP, etc"""
|
|
2
|
|
3 import sys
|
|
4 import urllib
|
|
5 import urllib2
|
|
6 import logging
|
|
7
|
|
8
|
12
|
# Version string exposed at module level; presumably the version of this
# utility module itself (it is not referenced by the functions below).
srvTxtUtilsVersion = "1.2"
|
0
|
10
|
|
def getInt(number, default=0):
    """Return number converted to int, never raising for bad input.

    number  -- any value accepted by int(); anything else triggers the
               fallback.
    default -- value used when number cannot be converted; it is passed
               through int() as well.

    Returns int(number) if possible, otherwise int(default), otherwise 0
    (so the result is always an int, even when default itself is not
    convertible).
    """
    for candidate in (number, default):
        try:
            return int(candidate)
        except Exception:
            # "except Exception" instead of a bare except so that
            # KeyboardInterrupt / SystemExit are not swallowed.
            continue
    # neither number nor default could be converted
    return 0
|
|
17
|
1
|
def getAt(array, idx, default=None):
    """Return array[idx], or default if the lookup fails.

    array   -- any object supporting subscription (list, tuple, dict, ...);
               objects that cannot be subscripted (e.g. None) yield default.
    idx     -- index or key to look up.
    default -- value returned when the lookup raises.

    Ordinary errors (IndexError, KeyError, TypeError, ...) are turned into
    default; KeyboardInterrupt and SystemExit are allowed to propagate.
    """
    try:
        return array[idx]
    except Exception:
        # deliberately broad (best-effort accessor), but not a bare except:
        # interpreter-exit exceptions must not be hidden
        return default
|
|
24
|
12
|
def getText(node, recursive=0):
    """Return the text content of an ElementTree node as one string.

    node      -- an ElementTree element (anything with .text, iterable over
                 child elements that have .text and .tail), or None.
    recursive -- if false (default), only the node's own text plus the
                 text and tail of its direct children are collected; if
                 true, the text of all descendants is included, at any
                 depth.

    Returns '' for a None node. The tail of node itself is never included.
    """
    if node is None:
        return ''

    # ElementTree: text before the first child is in node.text, text that
    # follows a child element is stored in that child's .tail
    parts = [node.text or '']
    for child in node:
        if recursive:
            # pass the flag on, otherwise descent stops one level down
            parts.append(getText(child, recursive))
        else:
            parts.append(child.text or '')
        if child.tail:
            parts.append(child.tail)

    return ''.join(parts)
|
|
48
|
|
49
|
|
50
|
|
51 def getHttpData(url, data=None, num_tries=3, timeout=10):
|
|
52 """returns result from url+data HTTP request"""
|
|
53 # we do GET (by appending data to url)
|
|
54 if isinstance(data, str) or isinstance(data, unicode):
|
|
55 # if data is string then append
|
|
56 url = "%s?%s"%(url,data)
|
|
57 elif isinstance(data, dict) or isinstance(data, list) or isinstance(data, tuple):
|
|
58 # urlencode
|
|
59 url = "%s?%s"%(url,urllib.urlencode(data))
|
|
60
|
|
61 response = None
|
|
62 errmsg = None
|
|
63 for cnt in range(num_tries):
|
|
64 try:
|
|
65 logging.debug("getHttpData(#%s %ss) url=%s"%(cnt+1,timeout,url))
|
|
66 if sys.version_info < (2, 6):
|
|
67 # set timeout on socket -- ugly :-(
|
|
68 import socket
|
|
69 socket.setdefaulttimeout(float(timeout))
|
|
70 response = urllib2.urlopen(url)
|
|
71 else:
|
|
72 # timeout as parameter
|
|
73 response = urllib2.urlopen(url,timeout=float(timeout))
|
|
74 # check result?
|
|
75 break
|
|
76 except urllib2.HTTPError, e:
|
|
77 logging.error("getHttpData: HTTP error(%s): %s"%(e.code,e))
|
|
78 errmsg = str(e)
|
|
79 # stop trying
|
|
80 break
|
|
81 except urllib2.URLError, e:
|
|
82 logging.error("getHttpData: URLLIB error(%s): %s"%(e.reason,e))
|
|
83 errmsg = str(e)
|
|
84 # stop trying
|
|
85 #break
|
|
86
|
|
87 if response is not None:
|
|
88 data = response.read()
|
|
89 response.close()
|
|
90 return data
|
|
91
|
|
92 raise IOError("ERROR fetching HTTP data from %s: %s"%(url,errmsg))
|
|
93 #return None
|
|
94
|