annotate importFromOpenMind/importer/filterISMI.py @ 10:2a786f0d46a7

more comments in the code.
author casties
date Fri, 26 Jun 2015 10:59:53 +0200
parents 0ae6145e7c80
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
124ef8f3b22d initial
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents:
diff changeset
1 '''
124ef8f3b22d initial
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents:
diff changeset
2 Created on 22.04.2014
124ef8f3b22d initial
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents:
diff changeset
3
124ef8f3b22d initial
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents:
diff changeset
4 @author: dwinter
124ef8f3b22d initial
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents:
diff changeset
5 '''
124ef8f3b22d initial
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents:
diff changeset
6
2
e55656794c82 create and use separate export directory.
root@ismi.rz-berlin.mpg.de
parents: 0
diff changeset
7 import os
0
124ef8f3b22d initial
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents:
diff changeset
8 import json
124ef8f3b22d initial
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents:
diff changeset
9 import urllib.request
124ef8f3b22d initial
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents:
diff changeset
10
124ef8f3b22d initial
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents:
diff changeset
class Importer:
    """Fetch entities from the OpenMind JSON interface and export related ones.

    The currently loaded JSON document is kept in the ``data`` member. The
    code expects it to be a dict with an ``"ents"`` list, where each entity
    may carry ``"src_rels"`` and/or ``"tar_rels"`` lists of relation dicts.
    """

    # Endpoint used by loadallEnts() to download entities by id.
    _ENTS_URL = ("https://ismi.mpiwg-berlin.mpg.de/om4-ismi/jsonInterface"
                 "?include_content=true&include_romanization=true&method=get_ents")

    # Maximum number of ids sent in one get_ents request.
    _CHUNK_SIZE = 500

    def __init__(self):
        # Start with an empty document so the query methods work (and
        # return nothing) before anything has been loaded.
        self.data = {}

    def loadJSON(self, url):
        """Load JSON from URL.

        Saves the parsed JSON in the data member.
        """
        print(" loading "+url)
        # read() replaces readall(), which HTTPResponse does not provide on
        # current Python versions; the with-block closes the connection.
        with urllib.request.urlopen(url) as response:
            str_response = response.read().decode('utf-8')

        self.data = json.loads(str_response)

    def loadJSONFromFile(self, fn):
        """Load JSON from the file ``fn + ".json"``.

        Saves the parsed JSON in the data member.
        """
        print(" loading "+fn+".json")
        # json.load() no longer accepts an ``encoding`` argument; the text
        # encoding is fixed when the file is opened.
        with open(fn+".json", 'r', encoding="utf-8") as infile:
            self.data = json.load(infile)

    def getEntIdsMentioned(self, kind="tar", filterOC=()):
        """Extract related entities from the data member.

        kind: relation direction. "tar" reads each entity's "tar_rels" and
            collects the "src_id" of every relation; any other value reads
            "src_rels" and collects "tar_id".
        filterOC: object classes to skip; a relation is ignored when its
            "src_oc" (kind "tar") or "tar_oc" (otherwise) is in filterOC.

        Returns a tuple (ids, rels): a set of the related objects' ids as
        strings and a list of the relation dicts that were kept.
        """
        if kind == "tar":
            rel_type, id_type, oc_type = "tar_rels", "src_id", "src_oc"
        else:
            rel_type, id_type, oc_type = "src_rels", "tar_id", "tar_oc"

        ids = set()
        rels = []
        # A missing "ents" list or missing relation list is treated as empty.
        for ent in self.data.get("ents") or []:
            for rel in ent.get(rel_type) or []:
                if rel.get(oc_type) in filterOC:
                    continue
                ids.add(str(rel.get(id_type)))
                rels.append(rel)

        return ids, rels

    def loadallEnts(self, kind="tar", filterOC=()):
        """Get related entities from OpenMind.

        Gets all related entities' ids using kind and filterOC via
        getEntIdsMentioned() and downloads the entities in requests of at
        most _CHUNK_SIZE ids each. No request is made when there are no ids.

        Returns a tuple (ents, rels): the entities as a JSON string of the
        form {"ents": [...]} and the list of relations.
        """
        ids, rels = self.getEntIdsMentioned(kind=kind, filterOC=filterOC)

        # Sort once so the request order (and thus the output) is stable
        # across runs; set iteration order for strings is not.
        id_list = sorted(ids)

        ents = []
        # Stepping by chunk size yields exactly the needed number of
        # requests, with no trailing request carrying an empty id list.
        for start in range(0, len(id_list), self._CHUNK_SIZE):
            idsString = ",".join(id_list[start:start + self._CHUNK_SIZE])
            qs = self._ENTS_URL+"&ids="+idsString
            print(" loading ents from "+qs)
            with urllib.request.urlopen(qs) as response:
                entsJ = json.loads(response.read().decode('utf-8'))
            ents += entsJ.get("ents") or []

        return json.dumps({"ents": ents}), rels

    def saveallEnts(self, filename, kind="tar", filterOC=()):
        """Load all related entities and save them as JSON.

        Loads all related entities using kind and filterOC via loadallEnts().
        Saves entities in file filename.json.
        Saves relations in file filename_rels.json.
        """
        ents, rels = self.loadallEnts(kind=kind, filterOC=filterOC)

        print(" writing ", filename+".json")
        with open(filename+".json", "wb") as outfile:
            outfile.write(ents.encode('utf-8'))

        print(" writing ", filename+"_rels.json")
        with open(filename+"_rels.json", "w", encoding="utf-8") as outfile:
            json.dump({'rels': rels}, outfile)
124ef8f3b22d initial
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents:
diff changeset
125
124ef8f3b22d initial
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents:
diff changeset
126
124ef8f3b22d initial
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents:
diff changeset
if __name__ == '__main__':
    # Export pipeline: each step loads a set of entities into imp.data and
    # then saves the entities related to them. saveallEnts(name, ...) writes
    # the entities to name.json and the relations to name_rels.json.
    imp = Importer()

    #
    # load all public codices
    # contains codices with attributes and first-order relations
    #
    url = """https://ismi.mpiwg-berlin.mpg.de/om4-ismi/jsonInterface?method=get_public_codices"""

    imp.loadJSON(url)

    # create directory for export files
    exportDir = '/tmp/ismi_data'
    # exist_ok avoids the check-then-create race and does not fail when the
    # directory already exists.
    os.makedirs(exportDir, exist_ok=True)

    #
    # load and save all entities on target relations of codices as witnesses.json
    #
    imp.saveallEnts(os.path.join(exportDir, "witnesses"), kind="tar")

    #
    # load and save all entities on source relations of codices
    # except type codex and witness as codex_src.json
    #
    imp.saveallEnts(os.path.join(exportDir, "codex_src"), kind="src",
                    filterOC=['CODEX', 'WITNESS'])

    # now fetch all relations on the witnesses

    #
    # load the witnesses.json file from above
    #
    imp.loadJSONFromFile(os.path.join(exportDir, "witnesses"))

    #
    # load and save all entities on source relations
    # except type codex, witness, person as texts.json
    #
    imp.saveallEnts(os.path.join(exportDir, "texts"), kind="src",
                    filterOC=['CODEX', 'WITNESS', 'PERSON'])

    #
    # load the texts.json file from above
    #
    imp.loadJSONFromFile(os.path.join(exportDir, "texts"))

    #
    # load and save all entities on source relations
    # except type codex, witness and text as authors_subjects_src.json
    #
    imp.saveallEnts(os.path.join(exportDir, "authors_subjects_src"), kind="src",
                    filterOC=['CODEX', 'WITNESS', 'TEXT'])

    #
    # load and save all entities on target relations
    # except type codex, witness and text as authors_subjects_tar.json
    #
    imp.saveallEnts(os.path.join(exportDir, "authors_subjects_tar"), kind="tar",
                    filterOC=['CODEX', 'WITNESS', 'TEXT'])

    #
    # load the authors_subjects_src.json file from above
    #
    imp.loadJSONFromFile(os.path.join(exportDir, "authors_subjects_src"))

    #
    # load and save all entities on source relations
    # except type codex, witness, text and person as subjects_places.json
    #
    imp.saveallEnts(os.path.join(exportDir, "subjects_places"), kind="src",
                    filterOC=['CODEX', 'WITNESS', 'TEXT', 'PERSON'])

    #
    # load and save all entities on target relations
    # except type codex, witness, text and person as references_places.json
    #
    imp.saveallEnts(os.path.join(exportDir, "references_places"), kind="tar",
                    filterOC=['CODEX', 'WITNESS', 'TEXT', 'PERSON'])
0
124ef8f3b22d initial
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents:
diff changeset
198
124ef8f3b22d initial
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents:
diff changeset
199
124ef8f3b22d initial
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents:
diff changeset
200
124ef8f3b22d initial
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents:
diff changeset
201
124ef8f3b22d initial
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents:
diff changeset
202
124ef8f3b22d initial
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents:
diff changeset
203
124ef8f3b22d initial
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents:
diff changeset
204
124ef8f3b22d initial
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents:
diff changeset
205